program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3520.4.1"}, {"coremlc-version", "3520.5.1"}})] { func main(tensor cache_channel, tensor cache_len, tensor cache_time, tensor mel, tensor mel_length, tensor prompt_id) { tensor value_3_perm_0 = const()[name = tensor("value_3_perm_0"), val = tensor([1, 0, 2, 3])]; tensor cache_channel_to_fp16_dtype_0 = const()[name = tensor("cache_channel_to_fp16_dtype_0"), val = tensor("fp16")]; tensor value_5_perm_0 = const()[name = tensor("value_5_perm_0"), val = tensor([1, 0, 2, 3])]; tensor cache_time_to_fp16_dtype_0 = const()[name = tensor("cache_time_to_fp16_dtype_0"), val = tensor("fp16")]; tensor var_59 = const()[name = tensor("op_59"), val = tensor(-1)]; tensor var_68 = const()[name = tensor("op_68"), val = tensor(1)]; tensor x_1_perm_0 = const()[name = tensor("x_1_perm_0"), val = tensor([0, 2, 1])]; tensor mel_to_fp16_dtype_0 = const()[name = tensor("mel_to_fp16_dtype_0"), val = tensor("fp16")]; tensor tensor_1_axes_0 = const()[name = tensor("tensor_1_axes_0"), val = tensor([1])]; tensor mel_to_fp16 = cast(dtype = mel_to_fp16_dtype_0, x = mel)[name = tensor("cast_18")]; tensor x_1_cast_fp16 = transpose(perm = x_1_perm_0, x = mel_to_fp16)[name = tensor("transpose_367")]; tensor tensor_1_cast_fp16 = expand_dims(axes = tensor_1_axes_0, x = x_1_cast_fp16)[name = tensor("tensor_1_cast_fp16")]; tensor expand_dims_0 = const()[name = tensor("expand_dims_0"), val = tensor([[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64]])]; tensor var_137_axes_0 = const()[name = tensor("op_137_axes_0"), val = tensor([1])]; tensor var_137 = expand_dims(axes = var_137_axes_0, x = mel_length)[name = tensor("op_137")]; tensor time_mask_1 = less(x = expand_dims_0, y = var_137)[name = tensor("time_mask_1")]; tensor var_139_axes_0 = const()[name = tensor("op_139_axes_0"), val = tensor([-1])]; tensor var_139 = expand_dims(axes = var_139_axes_0, x = time_mask_1)[name = tensor("op_139")]; tensor var_141_reps_0 = const()[name = tensor("op_141_reps_0"), val = tensor([1, 1, 128])]; tensor var_141 = tile(reps = var_141_reps_0, x = var_139)[name = tensor("op_141")]; tensor var_147_axes_0 = const()[name = tensor("op_147_axes_0"), val = tensor([1])]; tensor cast_4_to_fp16_dtype_0 = const()[name = tensor("cast_4_to_fp16_dtype_0"), val = tensor("fp16")]; tensor var_141_to_fp16 = cast(dtype = cast_4_to_fp16_dtype_0, x = var_141)[name = tensor("cast_17")]; tensor var_147_cast_fp16 = expand_dims(axes = var_147_axes_0, x = var_141_to_fp16)[name = tensor("op_147_cast_fp16")]; tensor input_1_cast_fp16 = mul(x = tensor_1_cast_fp16, y = var_147_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor input_3_pad_0 = const()[name = tensor("input_3_pad_0"), val = tensor([0, 0, 0, 0, 2, 1, 2, 1])]; tensor input_3_mode_0 = const()[name = tensor("input_3_mode_0"), val = tensor("constant")]; tensor const_9_to_fp16 = const()[name = tensor("const_9_to_fp16"), val = tensor(0x0p+0)]; tensor input_3_cast_fp16 = pad(constant_val = const_9_to_fp16, mode = input_3_mode_0, pad = input_3_pad_0, x = input_1_cast_fp16)[name = tensor("input_3_cast_fp16")]; tensor tensor_3_pad_type_0 = const()[name = tensor("tensor_3_pad_type_0"), val = tensor("valid")]; tensor tensor_3_strides_0 = const()[name = tensor("tensor_3_strides_0"), val = tensor([2, 2])]; tensor tensor_3_pad_0 = const()[name = tensor("tensor_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor tensor_3_dilations_0 = const()[name = tensor("tensor_3_dilations_0"), val = tensor([1, 1])]; tensor tensor_3_groups_0 = const()[name = tensor("tensor_3_groups_0"), val = tensor(1)]; tensor encoder_pre_encode_conv_0_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_pre_encode_conv_0_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2752))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2432)))]; tensor encoder_pre_encode_conv_0_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3328)))]; tensor tensor_3_cast_fp16 = conv(bias = encoder_pre_encode_conv_0_bias_to_fp16, dilations = tensor_3_dilations_0, groups = tensor_3_groups_0, pad = tensor_3_pad_0, pad_type = tensor_3_pad_type_0, strides = tensor_3_strides_0, weight = encoder_pre_encode_conv_0_weight_to_fp16_quantized, x = input_3_cast_fp16)[name = tensor("tensor_3_cast_fp16")]; tensor cast_2_to_fp16_dtype_0 = const()[name = tensor("cast_2_to_fp16_dtype_0"), val = tensor("fp16")]; tensor var_160_promoted_to_fp16 = const()[name = tensor("op_160_promoted_to_fp16"), val = tensor(0x1p+1)]; tensor mel_length_to_fp16 = cast(dtype = cast_2_to_fp16_dtype_0, x = mel_length)[name = tensor("cast_16")]; tensor var_161_cast_fp16 = add(x = mel_length_to_fp16, y = var_160_promoted_to_fp16)[name = tensor("op_161_cast_fp16")]; tensor var_162_promoted_to_fp16 = const()[name = tensor("op_162_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor var_163_cast_fp16 = add(x = var_161_cast_fp16, y = var_162_promoted_to_fp16)[name = tensor("op_163_cast_fp16")]; tensor var_164_promoted_to_fp16 = const()[name = tensor("op_164_promoted_to_fp16"), val = tensor(0x1.8p+1)]; tensor var_165_cast_fp16 = sub(x = var_163_cast_fp16, y = var_164_promoted_to_fp16)[name = tensor("op_165_cast_fp16")]; tensor var_56_promoted_to_fp16 = const()[name = tensor("op_56_promoted_to_fp16"), val = tensor(0x1p+1)]; tensor floor_div_0_cast_fp16 = floor_div(x = var_165_cast_fp16, y = var_56_promoted_to_fp16)[name = tensor("floor_div_0_cast_fp16")]; tensor var_167_promoted_to_fp16 = const()[name = tensor("op_167_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor current_lengths_3_cast_fp16 = add(x = floor_div_0_cast_fp16, y = var_167_promoted_to_fp16)[name = tensor("current_lengths_3_cast_fp16")]; tensor cast_5_dtype_0 = const()[name = tensor("cast_5_dtype_0"), val = tensor("int32")]; tensor expand_dims_1 = const()[name = tensor("expand_dims_1"), val = tensor([[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32]])]; tensor var_176_axes_0 = const()[name = tensor("op_176_axes_0"), val = tensor([1])]; tensor current_lengths_3_cast_fp16_to_int32 = cast(dtype = cast_5_dtype_0, x = current_lengths_3_cast_fp16)[name = tensor("cast_15")]; tensor var_176 = expand_dims(axes = var_176_axes_0, x = current_lengths_3_cast_fp16_to_int32)[name = tensor("op_176")]; tensor time_mask_3 = less(x = expand_dims_1, y = var_176)[name = tensor("time_mask_3")]; tensor var_178_axes_0 = const()[name = tensor("op_178_axes_0"), val = tensor([-1])]; tensor var_178 = expand_dims(axes = var_178_axes_0, x = time_mask_3)[name = tensor("op_178")]; tensor var_180_reps_0 = const()[name = tensor("op_180_reps_0"), val = tensor([1, 1, 65])]; tensor var_180 = tile(reps = var_180_reps_0, x = var_178)[name = tensor("op_180")]; tensor var_186_axes_0 = const()[name = tensor("op_186_axes_0"), val = tensor([1])]; tensor cast_6_to_fp16_dtype_0 = const()[name = tensor("cast_6_to_fp16_dtype_0"), val = tensor("fp16")]; tensor var_180_to_fp16 = cast(dtype = cast_6_to_fp16_dtype_0, x = var_180)[name = tensor("cast_14")]; tensor var_186_cast_fp16 = expand_dims(axes = var_186_axes_0, x = var_180_to_fp16)[name = tensor("op_186_cast_fp16")]; tensor expanded_mask_3_reps_0 = const()[name = tensor("expanded_mask_3_reps_0"), val = tensor([1, 256, 1, 1])]; tensor expanded_mask_3_cast_fp16 = tile(reps = expanded_mask_3_reps_0, x = var_186_cast_fp16)[name = tensor("expanded_mask_3_cast_fp16")]; tensor input_5_cast_fp16 = mul(x = tensor_3_cast_fp16, y = expanded_mask_3_cast_fp16)[name = tensor("input_5_cast_fp16")]; tensor tensor_5_cast_fp16 = relu(x = input_5_cast_fp16)[name = tensor("tensor_5_cast_fp16")]; tensor input_7_cast_fp16 = mul(x = tensor_5_cast_fp16, y = expanded_mask_3_cast_fp16)[name = tensor("input_7_cast_fp16")]; tensor input_9_pad_0 = const()[name = tensor("input_9_pad_0"), val = tensor([0, 0, 0, 0, 2, 1, 2, 1])]; tensor input_9_mode_0 = const()[name = tensor("input_9_mode_0"), val = tensor("constant")]; tensor const_23_to_fp16 = const()[name = tensor("const_23_to_fp16"), val = tensor(0x0p+0)]; tensor input_9_cast_fp16 = pad(constant_val = const_23_to_fp16, mode = input_9_mode_0, pad = input_9_pad_0, x = input_7_cast_fp16)[name = tensor("input_9_cast_fp16")]; tensor tensor_7_pad_type_0 = const()[name = tensor("tensor_7_pad_type_0"), val = tensor("valid")]; tensor tensor_7_strides_0 = const()[name = tensor("tensor_7_strides_0"), val = tensor([2, 2])]; tensor tensor_7_groups_0 = const()[name = tensor("tensor_7_groups_0"), val = tensor(256)]; tensor tensor_7_pad_0 = const()[name = tensor("tensor_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor tensor_7_dilations_0 = const()[name = tensor("tensor_7_dilations_0"), val = tensor([1, 1])]; tensor encoder_pre_encode_conv_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_pre_encode_conv_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3904))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6272))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2432)))]; tensor encoder_pre_encode_conv_2_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6848)))]; tensor tensor_7_cast_fp16 = conv(bias = encoder_pre_encode_conv_2_bias_to_fp16, dilations = tensor_7_dilations_0, groups = tensor_7_groups_0, pad = tensor_7_pad_0, pad_type = tensor_7_pad_type_0, strides = tensor_7_strides_0, weight = encoder_pre_encode_conv_2_weight_to_fp16_quantized, x = input_9_cast_fp16)[name = tensor("tensor_7_cast_fp16")]; tensor var_208_promoted_to_fp16 = const()[name = tensor("op_208_promoted_to_fp16"), val = tensor(0x1p+1)]; tensor var_209_cast_fp16 = add(x = current_lengths_3_cast_fp16, y = var_208_promoted_to_fp16)[name = tensor("op_209_cast_fp16")]; tensor var_210_promoted_to_fp16 = const()[name = tensor("op_210_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor var_211_cast_fp16 = add(x = var_209_cast_fp16, y = var_210_promoted_to_fp16)[name = tensor("op_211_cast_fp16")]; tensor var_212_promoted_to_fp16 = const()[name = tensor("op_212_promoted_to_fp16"), val = tensor(0x1.8p+1)]; tensor var_213_cast_fp16 = sub(x = var_211_cast_fp16, y = var_212_promoted_to_fp16)[name = tensor("op_213_cast_fp16")]; tensor var_56_promoted_1_to_fp16 = const()[name = tensor("op_56_promoted_1_to_fp16"), val = tensor(0x1p+1)]; tensor floor_div_1_cast_fp16 = floor_div(x = var_213_cast_fp16, y = var_56_promoted_1_to_fp16)[name = tensor("floor_div_1_cast_fp16")]; tensor var_215_promoted_to_fp16 = const()[name = tensor("op_215_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor current_lengths_5_cast_fp16 = add(x = floor_div_1_cast_fp16, y = var_215_promoted_to_fp16)[name = tensor("current_lengths_5_cast_fp16")]; tensor cast_7_dtype_0 = const()[name = tensor("cast_7_dtype_0"), val = tensor("int32")]; tensor expand_dims_2 = const()[name = tensor("expand_dims_2"), val = tensor([[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16]])]; tensor var_224_axes_0 = const()[name = tensor("op_224_axes_0"), val = tensor([1])]; tensor current_lengths_5_cast_fp16_to_int32 = cast(dtype = cast_7_dtype_0, x = current_lengths_5_cast_fp16)[name = tensor("cast_13")]; tensor var_224 = expand_dims(axes = var_224_axes_0, x = current_lengths_5_cast_fp16_to_int32)[name = tensor("op_224")]; tensor time_mask_5 = less(x = expand_dims_2, y = var_224)[name = tensor("time_mask_5")]; tensor var_226_axes_0 = const()[name = tensor("op_226_axes_0"), val = tensor([-1])]; tensor var_226 = expand_dims(axes = var_226_axes_0, x = time_mask_5)[name = tensor("op_226")]; tensor var_228_reps_0 = const()[name = tensor("op_228_reps_0"), val = tensor([1, 1, 33])]; tensor var_228 = tile(reps = var_228_reps_0, x = var_226)[name = tensor("op_228")]; tensor var_234_axes_0 = const()[name = tensor("op_234_axes_0"), val = tensor([1])]; tensor cast_8_to_fp16_dtype_0 = const()[name = tensor("cast_8_to_fp16_dtype_0"), val = tensor("fp16")]; tensor var_228_to_fp16 = cast(dtype = cast_8_to_fp16_dtype_0, x = var_228)[name = tensor("cast_12")]; tensor var_234_cast_fp16 = expand_dims(axes = var_234_axes_0, x = var_228_to_fp16)[name = tensor("op_234_cast_fp16")]; tensor expanded_mask_7_reps_0 = const()[name = tensor("expanded_mask_7_reps_0"), val = tensor([1, 256, 1, 1])]; tensor expanded_mask_7_cast_fp16 = tile(reps = expanded_mask_7_reps_0, x = var_234_cast_fp16)[name = tensor("expanded_mask_7_cast_fp16")]; tensor input_11_cast_fp16 = mul(x = tensor_7_cast_fp16, y = expanded_mask_7_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor tensor_9_pad_type_0 = const()[name = tensor("tensor_9_pad_type_0"), val = tensor("valid")]; tensor tensor_9_strides_0 = const()[name = tensor("tensor_9_strides_0"), val = tensor([1, 1])]; tensor tensor_9_pad_0 = const()[name = tensor("tensor_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor tensor_9_dilations_0 = const()[name = tensor("tensor_9_dilations_0"), val = tensor([1, 1])]; tensor tensor_9_groups_0 = const()[name = tensor("tensor_9_groups_0"), val = tensor(1)]; tensor encoder_pre_encode_conv_3_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_pre_encode_conv_3_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7424))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(73024))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2432)))]; tensor encoder_pre_encode_conv_3_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(73600)))]; tensor tensor_9_cast_fp16 = conv(bias = encoder_pre_encode_conv_3_bias_to_fp16, dilations = tensor_9_dilations_0, groups = tensor_9_groups_0, pad = tensor_9_pad_0, pad_type = tensor_9_pad_type_0, strides = tensor_9_strides_0, weight = encoder_pre_encode_conv_3_weight_to_fp16_quantized, x = input_11_cast_fp16)[name = tensor("tensor_9_cast_fp16")]; tensor input_13_cast_fp16 = mul(x = tensor_9_cast_fp16, y = expanded_mask_7_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor tensor_11_cast_fp16 = relu(x = input_13_cast_fp16)[name = tensor("tensor_11_cast_fp16")]; tensor input_15_cast_fp16 = mul(x = tensor_11_cast_fp16, y = expanded_mask_7_cast_fp16)[name = tensor("input_15_cast_fp16")]; tensor input_17_pad_0 = const()[name = tensor("input_17_pad_0"), val = tensor([0, 0, 0, 0, 2, 1, 2, 1])]; tensor input_17_mode_0 = const()[name = tensor("input_17_mode_0"), val = tensor("constant")]; tensor const_41_to_fp16 = const()[name = tensor("const_41_to_fp16"), val = tensor(0x0p+0)]; tensor input_17_cast_fp16 = pad(constant_val = const_41_to_fp16, mode = input_17_mode_0, pad = input_17_pad_0, x = input_15_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor tensor_13_pad_type_0 = const()[name = tensor("tensor_13_pad_type_0"), val = tensor("valid")]; tensor tensor_13_strides_0 = const()[name = tensor("tensor_13_strides_0"), val = tensor([2, 2])]; tensor tensor_13_groups_0 = const()[name = tensor("tensor_13_groups_0"), val = tensor(256)]; tensor tensor_13_pad_0 = const()[name = tensor("tensor_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor tensor_13_dilations_0 = const()[name = tensor("tensor_13_dilations_0"), val = tensor([1, 1])]; tensor encoder_pre_encode_conv_5_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_pre_encode_conv_5_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74176))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76544))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2432)))]; tensor encoder_pre_encode_conv_5_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_5_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77120)))]; tensor tensor_13_cast_fp16 = conv(bias = encoder_pre_encode_conv_5_bias_to_fp16, dilations = tensor_13_dilations_0, groups = tensor_13_groups_0, pad = tensor_13_pad_0, pad_type = tensor_13_pad_type_0, strides = tensor_13_strides_0, weight = encoder_pre_encode_conv_5_weight_to_fp16_quantized, x = input_17_cast_fp16)[name = tensor("tensor_13_cast_fp16")]; tensor var_271_promoted_to_fp16 = const()[name = tensor("op_271_promoted_to_fp16"), val = tensor(0x1p+1)]; tensor var_272_cast_fp16 = add(x = current_lengths_5_cast_fp16, y = var_271_promoted_to_fp16)[name = tensor("op_272_cast_fp16")]; tensor var_273_promoted_to_fp16 = const()[name = tensor("op_273_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor var_274_cast_fp16 = add(x = var_272_cast_fp16, y = var_273_promoted_to_fp16)[name = tensor("op_274_cast_fp16")]; tensor var_275_promoted_to_fp16 = const()[name = tensor("op_275_promoted_to_fp16"), val = tensor(0x1.8p+1)]; tensor var_276_cast_fp16 = sub(x = var_274_cast_fp16, y = var_275_promoted_to_fp16)[name = tensor("op_276_cast_fp16")]; tensor var_56_promoted_2_to_fp16 = const()[name = tensor("op_56_promoted_2_to_fp16"), val = tensor(0x1p+1)]; tensor floor_div_2_cast_fp16 = floor_div(x = var_276_cast_fp16, y = var_56_promoted_2_to_fp16)[name = tensor("floor_div_2_cast_fp16")]; tensor var_278_promoted_to_fp16 = const()[name = tensor("op_278_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor current_lengths_cast_fp16 = add(x = floor_div_2_cast_fp16, y = var_278_promoted_to_fp16)[name = tensor("current_lengths_cast_fp16")]; tensor cast_9_dtype_0 = const()[name = tensor("cast_9_dtype_0"), val = tensor("int32")]; tensor expand_dims_3 = const()[name = tensor("expand_dims_3"), val = tensor([[0, 1, 2, 3, 4, 5, 6, 7, 8]])]; tensor var_287_axes_0 = const()[name = tensor("op_287_axes_0"), val = tensor([1])]; tensor current_lengths_cast_fp16_to_int32 = cast(dtype = cast_9_dtype_0, x = current_lengths_cast_fp16)[name = tensor("cast_11")]; tensor var_287 = expand_dims(axes = var_287_axes_0, x = current_lengths_cast_fp16_to_int32)[name = tensor("op_287")]; tensor time_mask = less(x = expand_dims_3, y = var_287)[name = tensor("time_mask")]; tensor var_289_axes_0 = const()[name = tensor("op_289_axes_0"), val = tensor([-1])]; tensor var_289 = expand_dims(axes = var_289_axes_0, x = time_mask)[name = tensor("op_289")]; tensor var_291_reps_0 = const()[name = tensor("op_291_reps_0"), val = tensor([1, 1, 17])]; tensor var_291 = tile(reps = var_291_reps_0, x = var_289)[name = tensor("op_291")]; tensor var_297_axes_0 = const()[name = tensor("op_297_axes_0"), val = tensor([1])]; tensor cast_10_to_fp16_dtype_0 = const()[name = tensor("cast_10_to_fp16_dtype_0"), val = tensor("fp16")]; tensor var_291_to_fp16 = cast(dtype = cast_10_to_fp16_dtype_0, x = var_291)[name = tensor("cast_10")]; tensor var_297_cast_fp16 = expand_dims(axes = var_297_axes_0, x = var_291_to_fp16)[name = tensor("op_297_cast_fp16")]; tensor expanded_mask_13_reps_0 = const()[name = tensor("expanded_mask_13_reps_0"), val = tensor([1, 256, 1, 1])]; tensor expanded_mask_13_cast_fp16 = tile(reps = expanded_mask_13_reps_0, x = var_297_cast_fp16)[name = tensor("expanded_mask_13_cast_fp16")]; tensor input_19_cast_fp16 = mul(x = tensor_13_cast_fp16, y = expanded_mask_13_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor tensor_15_pad_type_0 = const()[name = tensor("tensor_15_pad_type_0"), val = tensor("valid")]; tensor tensor_15_strides_0 = const()[name = tensor("tensor_15_strides_0"), val = tensor([1, 1])]; tensor tensor_15_pad_0 = const()[name = tensor("tensor_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor tensor_15_dilations_0 = const()[name = tensor("tensor_15_dilations_0"), val = tensor([1, 1])]; tensor tensor_15_groups_0 = const()[name = tensor("tensor_15_groups_0"), val = tensor(1)]; tensor encoder_pre_encode_conv_6_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_pre_encode_conv_6_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77696))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(143296))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2432)))]; tensor encoder_pre_encode_conv_6_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_6_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(143872)))]; tensor tensor_15_cast_fp16 = conv(bias = encoder_pre_encode_conv_6_bias_to_fp16, dilations = tensor_15_dilations_0, groups = tensor_15_groups_0, pad = tensor_15_pad_0, pad_type = tensor_15_pad_type_0, strides = tensor_15_strides_0, weight = encoder_pre_encode_conv_6_weight_to_fp16_quantized, x = input_19_cast_fp16)[name = tensor("tensor_15_cast_fp16")]; tensor input_21_cast_fp16 = mul(x = tensor_15_cast_fp16, y = expanded_mask_13_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor tensor_cast_fp16 = relu(x = input_21_cast_fp16)[name = tensor("tensor_cast_fp16")]; tensor x_3_cast_fp16 = mul(x = tensor_cast_fp16, y = expanded_mask_13_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor var_331_perm_0 = const()[name = tensor("op_331_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_332 = const()[name = tensor("op_332"), val = tensor([1, 9, -1])]; tensor var_331_cast_fp16 = transpose(perm = var_331_perm_0, x = x_3_cast_fp16)[name = tensor("transpose_366")]; tensor input_23_cast_fp16 = reshape(shape = var_332, x = var_331_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor encoder_pre_encode_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_pre_encode_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144448))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4602048))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_pre_encode_out_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4604160)))]; tensor linear_0_cast_fp16 = linear(bias = encoder_pre_encode_out_bias_to_fp16, weight = encoder_pre_encode_out_weight_to_fp16_quantized, x = input_23_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor var_342_begin_0 = const()[name = tensor("op_342_begin_0"), val = tensor([0, 2, 0])]; tensor var_342_end_0 = const()[name = tensor("op_342_end_0"), val = tensor([1, 9, 1024])]; tensor var_342_end_mask_0 = const()[name = tensor("op_342_end_mask_0"), val = tensor([true, true, true])]; tensor var_342_cast_fp16 = slice_by_index(begin = var_342_begin_0, end = var_342_end_0, end_mask = var_342_end_mask_0, x = linear_0_cast_fp16)[name = tensor("op_342_cast_fp16")]; tensor var_344 = const()[name = tensor("op_344"), val = tensor(2)]; tensor var_345 = sub(x = current_lengths_cast_fp16_to_int32, y = var_344)[name = tensor("op_345")]; tensor var_345_promoted_to_fp16_dtype_0 = const()[name = tensor("op_345_promoted_to_fp16_dtype_0"), val = tensor("fp16")]; tensor var_62_promoted_to_fp16 = const()[name = tensor("op_62_promoted_to_fp16"), val = tensor(0x0p+0)]; tensor const_61_to_fp16 = const()[name = tensor("const_61_to_fp16"), val = tensor(inf)]; tensor var_345_to_fp16 = cast(dtype = var_345_promoted_to_fp16_dtype_0, x = var_345)[name = tensor("cast_9")]; tensor clip_0_cast_fp16 = clip(alpha = var_62_promoted_to_fp16, beta = const_61_to_fp16, x = var_345_to_fp16)[name = tensor("clip_0_cast_fp16")]; tensor max_audio_length_1 = const()[name = tensor("max_audio_length_1"), val = tensor([7])]; tensor var_361_promoted_to_fp16 = const()[name = tensor("op_361_promoted_to_fp16"), val = tensor(0x1.5p+5)]; tensor padding_length_cast_fp16 = add(x = clip_0_cast_fp16, y = var_361_promoted_to_fp16)[name = tensor("padding_length_cast_fp16")]; tensor const_63 = const()[name = tensor("const_63"), val = tensor(-1)]; tensor var_363 = mul(x = cache_len, y = const_63)[name = tensor("op_363")]; tensor var_364 = const()[name = tensor("op_364"), val = tensor(42)]; tensor offset = add(x = var_363, y = var_364)[name = tensor("offset")]; tensor var_404_axes_0 = const()[name = tensor("op_404_axes_0"), val = tensor([-1])]; tensor var_404_cast_fp16 = expand_dims(axes = var_404_axes_0, x = padding_length_cast_fp16)[name = tensor("op_404_cast_fp16")]; tensor var_403_promoted_to_fp16 = const()[name = tensor("op_403_promoted_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4606272)))]; tensor pad_mask_1_cast_fp16 = less(x = var_403_promoted_to_fp16, y = var_404_cast_fp16)[name = tensor("pad_mask_1_cast_fp16")]; tensor expand_dims_5 = const()[name = tensor("expand_dims_5"), val = tensor([[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48]])]; tensor var_410_axes_0 = const()[name = tensor("op_410_axes_0"), val = tensor([-1])]; tensor var_410 = expand_dims(axes = var_410_axes_0, x = offset)[name = tensor("op_410")]; tensor pad_mask_off = greater_equal(x = expand_dims_5, y = var_410)[name = tensor("pad_mask_off")]; tensor pad_mask_3 = logical_and(x = pad_mask_off, y = pad_mask_1_cast_fp16)[name = tensor("pad_mask_3")]; tensor var_413_axes_0 = const()[name = tensor("op_413_axes_0"), val = tensor([1])]; tensor var_413 = expand_dims(axes = var_413_axes_0, x = pad_mask_3)[name = tensor("op_413")]; tensor var_414 = const()[name = tensor("op_414"), val = tensor([1, 49, 1])]; tensor pad_mask_for_att_mask_1 = tile(reps = var_414, x = var_413)[name = tensor("pad_mask_for_att_mask_1")]; tensor var_416_perm_0 = const()[name = tensor("op_416_perm_0"), val = tensor([0, 2, 1])]; tensor var_416 = transpose(perm = var_416_perm_0, x = pad_mask_for_att_mask_1)[name = tensor("transpose_365")]; tensor pad_mask_for_att_mask = logical_and(x = pad_mask_for_att_mask_1, y = var_416)[name = tensor("pad_mask_for_att_mask")]; tensor const_71 = const()[name = tensor("const_71"), val = tensor([[[true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true]]])]; tensor att_mask_9 = logical_and(x = pad_mask_for_att_mask, y = const_71)[name = tensor("att_mask_9")]; tensor att_mask = logical_not(x = att_mask_9)[name = tensor("att_mask")]; tensor pad_mask_5 = logical_not(x = pad_mask_3)[name = tensor("pad_mask_5")]; tensor pad_mask_begin_0 = const()[name = tensor("pad_mask_begin_0"), val = tensor([0, 42])]; tensor pad_mask_end_0 = const()[name = tensor("pad_mask_end_0"), val = tensor([1, 49])]; tensor pad_mask_end_mask_0 = const()[name = tensor("pad_mask_end_mask_0"), val = tensor([true, true])]; tensor pad_mask = slice_by_index(begin = pad_mask_begin_0, end = pad_mask_end_0, end_mask = pad_mask_end_mask_0, x = pad_mask_5)[name = tensor("pad_mask")]; tensor mask_9_begin_0 = const()[name = tensor("mask_9_begin_0"), val = tensor([0, 42, 0])]; tensor mask_9_end_0 = const()[name = tensor("mask_9_end_0"), val = tensor([1, 49, 49])]; tensor mask_9_end_mask_0 = const()[name = tensor("mask_9_end_mask_0"), val = tensor([true, true, true])]; tensor mask_9 = slice_by_index(begin = mask_9_begin_0, end = mask_9_end_0, end_mask = mask_9_end_mask_0, x = att_mask)[name = tensor("mask_9")]; tensor cache_1_begin_0 = const()[name = tensor("cache_1_begin_0"), val = tensor([0, 0, 0, 0])]; tensor cache_1_end_0 = const()[name = tensor("cache_1_end_0"), val = tensor([1, 1, 42, 1024])]; tensor cache_1_end_mask_0 = const()[name = tensor("cache_1_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_1_squeeze_mask_0 = const()[name = tensor("cache_1_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_channel_to_fp16 = cast(dtype = cache_channel_to_fp16_dtype_0, x = cache_channel)[name = tensor("cast_8")]; tensor value_3_cast_fp16 = transpose(perm = value_3_perm_0, x = cache_channel_to_fp16)[name = tensor("transpose_364")]; tensor cache_1_cast_fp16 = slice_by_index(begin = cache_1_begin_0, end = cache_1_end_0, end_mask = cache_1_end_mask_0, squeeze_mask = cache_1_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_1_cast_fp16")]; tensor cache_3_begin_0 = const()[name = tensor("cache_3_begin_0"), val = tensor([0, 0, 0, 0])]; tensor cache_3_end_0 = const()[name = tensor("cache_3_end_0"), val = tensor([1, 1, 1024, 8])]; tensor cache_3_end_mask_0 = const()[name = tensor("cache_3_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_3_squeeze_mask_0 = const()[name = tensor("cache_3_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_time_to_fp16 = cast(dtype = cache_time_to_fp16_dtype_0, x = cache_time)[name = tensor("cast_7")]; tensor value_5_cast_fp16 = transpose(perm = value_5_perm_0, x = cache_time_to_fp16)[name = tensor("transpose_363")]; tensor cache_3_cast_fp16 = slice_by_index(begin = cache_3_begin_0, end = cache_3_end_0, end_mask = cache_3_end_mask_0, squeeze_mask = cache_3_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_3_cast_fp16")]; tensor input_27_axes_0 = const()[name = tensor("input_27_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_0_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4606464)))]; tensor encoder_layers_0_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_0_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4608576)))]; tensor var_42_to_fp16 = const()[name = tensor("op_42_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_27_cast_fp16 = layer_norm(axes = input_27_axes_0, beta = encoder_layers_0_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_0_norm_feed_forward1_weight_to_fp16, x = var_342_cast_fp16)[name = tensor("input_27_cast_fp16")]; tensor encoder_layers_0_feed_forward1_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_feed_forward1_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4610688))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8809216))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_0_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_0_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8817472)))]; tensor linear_1_cast_fp16 = linear(bias = encoder_layers_0_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_0_feed_forward1_linear1_weight_to_fp16_quantized, x = input_27_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor input_31_cast_fp16 = silu(x = linear_1_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor encoder_layers_0_feed_forward1_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_feed_forward1_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8825728))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13020096))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_0_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_0_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13022208)))]; tensor linear_2_cast_fp16 = linear(bias = encoder_layers_0_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_0_feed_forward1_linear2_weight_to_fp16_quantized, x = input_31_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor var_455_to_fp16 = const()[name = tensor("op_455_to_fp16"), val = tensor(0x1p-1)]; tensor var_456_cast_fp16 = mul(x = linear_2_cast_fp16, y = var_455_to_fp16)[name = tensor("op_456_cast_fp16")]; tensor input_37_cast_fp16 = add(x = var_342_cast_fp16, y = var_456_cast_fp16)[name = tensor("input_37_cast_fp16")]; tensor key_1_axes_0 = const()[name = tensor("key_1_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_0_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13024320)))]; tensor encoder_layers_0_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_0_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13026432)))]; tensor key_1_cast_fp16 = layer_norm(axes = key_1_axes_0, beta = encoder_layers_0_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_0_norm_self_att_weight_to_fp16, x = input_37_cast_fp16)[name = tensor("key_1_cast_fp16")]; tensor input_39_interleave_0 = const()[name = tensor("input_39_interleave_0"), val = tensor(false)]; tensor input_39_cast_fp16 = concat(axis = var_68, interleave = input_39_interleave_0, values = (cache_1_cast_fp16, key_1_cast_fp16))[name = tensor("input_39_cast_fp16")]; tensor var_478_begin_0 = const()[name = tensor("op_478_begin_0"), val = tensor([0, 7, 0])]; tensor var_478_end_0 = const()[name = tensor("op_478_end_0"), val = tensor([1, 42, 1024])]; tensor var_478_end_mask_0 = const()[name = tensor("op_478_end_mask_0"), val = tensor([true, true, true])]; tensor var_478_cast_fp16 = slice_by_index(begin = var_478_begin_0, end = var_478_end_0, end_mask = var_478_end_mask_0, x = cache_1_cast_fp16)[name = tensor("op_478_cast_fp16")]; tensor var_484_interleave_0 = const()[name = tensor("op_484_interleave_0"), val = tensor(false)]; tensor var_484_cast_fp16 = concat(axis = var_68, interleave = var_484_interleave_0, values = (var_478_cast_fp16, key_1_cast_fp16))[name = tensor("op_484_cast_fp16")]; tensor encoder_layers_0_self_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_self_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13028544))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14077184))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_0_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14079296)))]; tensor linear_3_cast_fp16 = linear(bias = encoder_layers_0_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_0_self_attn_linear_q_weight_to_fp16_quantized, x = key_1_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor var_489 = const()[name = tensor("op_489"), val = tensor([1, -1, 8, 128])]; tensor q_1_cast_fp16 = reshape(shape = var_489, x = linear_3_cast_fp16)[name = tensor("q_1_cast_fp16")]; tensor encoder_layers_0_self_attn_linear_k_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_self_attn_linear_k_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14081408))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15130048))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_0_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15132160)))]; tensor linear_4_cast_fp16 = linear(bias = encoder_layers_0_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_0_self_attn_linear_k_weight_to_fp16_quantized, x = input_39_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor var_494 = const()[name = tensor("op_494"), val = tensor([1, -1, 8, 128])]; tensor k_1_cast_fp16 = reshape(shape = var_494, x = linear_4_cast_fp16)[name = tensor("k_1_cast_fp16")]; tensor encoder_layers_0_self_attn_linear_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_self_attn_linear_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15134272))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16182912))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_0_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16185024)))]; tensor linear_5_cast_fp16 = linear(bias = encoder_layers_0_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_0_self_attn_linear_v_weight_to_fp16_quantized, x = input_39_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor var_499 = const()[name = tensor("op_499"), val = tensor([1, -1, 8, 128])]; tensor v_1_cast_fp16 = reshape(shape = var_499, x = linear_5_cast_fp16)[name = tensor("v_1_cast_fp16")]; tensor value_9_perm_0 = const()[name = tensor("value_9_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_0_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16187136)))]; tensor var_512_cast_fp16 = add(x = q_1_cast_fp16, y = encoder_layers_0_self_attn_pos_bias_u_to_fp16)[name = tensor("op_512_cast_fp16")]; tensor encoder_layers_0_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16189248)))]; tensor var_514_cast_fp16 = add(x = q_1_cast_fp16, y = encoder_layers_0_self_attn_pos_bias_v_to_fp16)[name = tensor("op_514_cast_fp16")]; tensor q_with_bias_v_1_perm_0 = const()[name = tensor("q_with_bias_v_1_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_7_transpose_x_0 = const()[name = tensor("x_7_transpose_x_0"), val = tensor(false)]; tensor x_7_transpose_y_0 = const()[name = tensor("x_7_transpose_y_0"), val = tensor(false)]; tensor op_516_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_516_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16191360))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16290944))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16290752)))]; tensor q_with_bias_v_1_cast_fp16 = transpose(perm = q_with_bias_v_1_perm_0, x = var_514_cast_fp16)[name = tensor("transpose_362")]; tensor x_7_cast_fp16 = matmul(transpose_x = x_7_transpose_x_0, transpose_y = x_7_transpose_y_0, x = q_with_bias_v_1_cast_fp16, y = op_516_to_fp16_quantized)[name = tensor("x_7_cast_fp16")]; tensor x_9_pad_0 = const()[name = tensor("x_9_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_9_mode_0 = const()[name = tensor("x_9_mode_0"), val = tensor("constant")]; tensor const_79_to_fp16 = const()[name = tensor("const_79_to_fp16"), val = tensor(0x0p+0)]; tensor x_9_cast_fp16 = pad(constant_val = const_79_to_fp16, mode = x_9_mode_0, pad = x_9_pad_0, x = x_7_cast_fp16)[name = tensor("x_9_cast_fp16")]; tensor var_524 = const()[name = tensor("op_524"), val = tensor([1, 8, -1, 7])]; tensor x_11_cast_fp16 = reshape(shape = var_524, x = x_9_cast_fp16)[name = tensor("x_11_cast_fp16")]; tensor var_528_begin_0 = const()[name = tensor("op_528_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_528_end_0 = const()[name = tensor("op_528_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_528_end_mask_0 = const()[name = tensor("op_528_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_528_cast_fp16 = slice_by_index(begin = var_528_begin_0, end = var_528_end_0, end_mask = var_528_end_mask_0, x = x_11_cast_fp16)[name = tensor("op_528_cast_fp16")]; tensor var_529 = const()[name = tensor("op_529"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_1_cast_fp16 = reshape(shape = var_529, x = var_528_cast_fp16)[name = tensor("matrix_bd_1_cast_fp16")]; tensor matrix_ac_1_transpose_x_0 = const()[name = tensor("matrix_ac_1_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_1_transpose_y_0 = const()[name = tensor("matrix_ac_1_transpose_y_0"), val = tensor(false)]; tensor transpose_96_perm_0 = const()[name = tensor("transpose_96_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_97_perm_0 = const()[name = tensor("transpose_97_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_97 = transpose(perm = transpose_97_perm_0, x = k_1_cast_fp16)[name = tensor("transpose_360")]; tensor transpose_96 = transpose(perm = transpose_96_perm_0, x = var_512_cast_fp16)[name = tensor("transpose_361")]; tensor matrix_ac_1_cast_fp16 = matmul(transpose_x = matrix_ac_1_transpose_x_0, transpose_y = matrix_ac_1_transpose_y_0, x = transpose_96, y = transpose_97)[name = tensor("matrix_ac_1_cast_fp16")]; tensor matrix_bd_3_begin_0 = const()[name = tensor("matrix_bd_3_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_3_end_0 = const()[name = tensor("matrix_bd_3_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_3_end_mask_0 = const()[name = tensor("matrix_bd_3_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_3_cast_fp16 = slice_by_index(begin = matrix_bd_3_begin_0, end = matrix_bd_3_end_0, end_mask = matrix_bd_3_end_mask_0, x = matrix_bd_1_cast_fp16)[name = tensor("matrix_bd_3_cast_fp16")]; tensor var_538_cast_fp16 = add(x = matrix_ac_1_cast_fp16, y = matrix_bd_3_cast_fp16)[name = tensor("op_538_cast_fp16")]; tensor _inversed_scores_1_y_0_to_fp16 = const()[name = tensor("_inversed_scores_1_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_1_cast_fp16 = mul(x = var_538_cast_fp16, y = _inversed_scores_1_y_0_to_fp16)[name = tensor("_inversed_scores_1_cast_fp16")]; tensor mask_11_axes_0 = const()[name = tensor("mask_11_axes_0"), val = tensor([1])]; tensor mask_11 = expand_dims(axes = mask_11_axes_0, x = mask_9)[name = tensor("mask_11")]; tensor var_45_to_fp16 = const()[name = tensor("op_45_to_fp16"), val = tensor(-0x1.388p+13)]; tensor scores_3_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_1_cast_fp16, cond = mask_11)[name = tensor("scores_3_cast_fp16")]; tensor var_544_cast_fp16 = softmax(axis = var_59, x = scores_3_cast_fp16)[name = tensor("op_544_cast_fp16")]; tensor var_44_to_fp16 = const()[name = tensor("op_44_to_fp16"), val = tensor(0x0p+0)]; tensor input_41_cast_fp16 = select(a = var_44_to_fp16, b = var_544_cast_fp16, cond = mask_11)[name = tensor("input_41_cast_fp16")]; tensor x_13_transpose_x_0 = const()[name = tensor("x_13_transpose_x_0"), val = tensor(false)]; tensor x_13_transpose_y_0 = const()[name = tensor("x_13_transpose_y_0"), val = tensor(false)]; tensor value_9_cast_fp16 = transpose(perm = value_9_perm_0, x = v_1_cast_fp16)[name = tensor("transpose_359")]; tensor x_13_cast_fp16 = matmul(transpose_x = x_13_transpose_x_0, transpose_y = x_13_transpose_y_0, x = input_41_cast_fp16, y = value_9_cast_fp16)[name = tensor("x_13_cast_fp16")]; tensor var_548_perm_0 = const()[name = tensor("op_548_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_549 = const()[name = tensor("op_549"), val = tensor([1, -1, 1024])]; tensor var_548_cast_fp16 = transpose(perm = var_548_perm_0, x = x_13_cast_fp16)[name = tensor("transpose_358")]; tensor input_43_cast_fp16 = reshape(shape = var_549, x = var_548_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor encoder_layers_0_self_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_self_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16291264))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17339904))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_0_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17342016)))]; tensor linear_7_cast_fp16 = linear(bias = encoder_layers_0_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_0_self_attn_linear_out_weight_to_fp16_quantized, x = input_43_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor input_47_cast_fp16 = add(x = input_37_cast_fp16, y = linear_7_cast_fp16)[name = tensor("input_47_cast_fp16")]; tensor x_17_axes_0 = const()[name = tensor("x_17_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_0_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17344128)))]; tensor encoder_layers_0_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_0_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17346240)))]; tensor x_17_cast_fp16 = layer_norm(axes = x_17_axes_0, beta = encoder_layers_0_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_0_norm_conv_weight_to_fp16, x = input_47_cast_fp16)[name = tensor("x_17_cast_fp16")]; tensor input_49_perm_0 = const()[name = tensor("input_49_perm_0"), val = tensor([0, 2, 1])]; tensor input_51_pad_type_0 = const()[name = tensor("input_51_pad_type_0"), val = tensor("valid")]; tensor input_51_strides_0 = const()[name = tensor("input_51_strides_0"), val = tensor([1])]; tensor input_51_pad_0 = const()[name = tensor("input_51_pad_0"), val = tensor([0, 0])]; tensor input_51_dilations_0 = const()[name = tensor("input_51_dilations_0"), val = tensor([1])]; tensor input_51_groups_0 = const()[name = tensor("input_51_groups_0"), val = tensor(1)]; tensor encoder_layers_0_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17348352))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19447680))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_49_cast_fp16 = transpose(perm = input_49_perm_0, x = x_17_cast_fp16)[name = tensor("transpose_357")]; tensor input_51_cast_fp16 = conv(dilations = input_51_dilations_0, groups = input_51_groups_0, pad = input_51_pad_0, pad_type = input_51_pad_type_0, strides = input_51_strides_0, weight = encoder_layers_0_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_49_cast_fp16)[name = tensor("input_51_cast_fp16")]; tensor x_19_split_num_splits_0 = const()[name = tensor("x_19_split_num_splits_0"), val = tensor(2)]; tensor x_19_split_axis_0 = const()[name = tensor("x_19_split_axis_0"), val = tensor(1)]; tensor x_19_split_cast_fp16_0, tensor x_19_split_cast_fp16_1 = split(axis = x_19_split_axis_0, num_splits = x_19_split_num_splits_0, x = input_51_cast_fp16)[name = tensor("x_19_split_cast_fp16")]; tensor x_19_split_1_sigmoid_cast_fp16 = sigmoid(x = x_19_split_cast_fp16_1)[name = tensor("x_19_split_1_sigmoid_cast_fp16")]; tensor x_19_cast_fp16 = mul(x = x_19_split_cast_fp16_0, y = x_19_split_1_sigmoid_cast_fp16)[name = tensor("x_19_cast_fp16")]; tensor var_575_axes_0 = const()[name = tensor("op_575_axes_0"), val = tensor([1])]; tensor var_575 = expand_dims(axes = var_575_axes_0, x = pad_mask)[name = tensor("op_575")]; tensor input_53_cast_fp16 = select(a = var_44_to_fp16, b = x_19_cast_fp16, cond = var_575)[name = tensor("input_53_cast_fp16")]; tensor new_x_3_interleave_0 = const()[name = tensor("new_x_3_interleave_0"), val = tensor(false)]; tensor new_x_3_cast_fp16 = concat(axis = var_59, interleave = new_x_3_interleave_0, values = (cache_3_cast_fp16, input_53_cast_fp16))[name = tensor("new_x_3_cast_fp16")]; tensor var_588_begin_0 = const()[name = tensor("op_588_begin_0"), val = tensor([0, 0, 7])]; tensor var_588_end_0 = const()[name = tensor("op_588_end_0"), val = tensor([1, 1024, 15])]; tensor var_588_end_mask_0 = const()[name = tensor("op_588_end_mask_0"), val = tensor([true, true, true])]; tensor var_588_cast_fp16 = slice_by_index(begin = var_588_begin_0, end = var_588_end_0, end_mask = var_588_end_mask_0, x = new_x_3_cast_fp16)[name = tensor("op_588_cast_fp16")]; tensor x_21_pad_type_0 = const()[name = tensor("x_21_pad_type_0"), val = tensor("valid")]; tensor x_21_groups_0 = const()[name = tensor("x_21_groups_0"), val = tensor(1024)]; tensor x_21_strides_0 = const()[name = tensor("x_21_strides_0"), val = tensor([1])]; tensor x_21_pad_0 = const()[name = tensor("x_21_pad_0"), val = tensor([0, 0])]; tensor x_21_dilations_0 = const()[name = tensor("x_21_dilations_0"), val = tensor([1])]; tensor encoder_layers_0_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19451840))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19461120))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_21_cast_fp16 = conv(dilations = x_21_dilations_0, groups = x_21_groups_0, pad = x_21_pad_0, pad_type = x_21_pad_type_0, strides = x_21_strides_0, weight = encoder_layers_0_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_3_cast_fp16)[name = tensor("x_21_cast_fp16")]; tensor input_55_perm_0 = const()[name = tensor("input_55_perm_0"), val = tensor([0, 2, 1])]; tensor x_23_axes_0 = const()[name = tensor("x_23_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_0_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19463232)))]; tensor encoder_layers_0_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_0_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19465344)))]; tensor input_55_cast_fp16 = transpose(perm = input_55_perm_0, x = x_21_cast_fp16)[name = tensor("transpose_356")]; tensor x_23_cast_fp16 = layer_norm(axes = x_23_axes_0, beta = encoder_layers_0_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_0_conv_batch_norm_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("x_23_cast_fp16")]; tensor input_57_perm_0 = const()[name = tensor("input_57_perm_0"), val = tensor([0, 2, 1])]; tensor input_57_cast_fp16 = transpose(perm = input_57_perm_0, x = x_23_cast_fp16)[name = tensor("transpose_355")]; tensor input_59_cast_fp16 = silu(x = input_57_cast_fp16)[name = tensor("input_59_cast_fp16")]; tensor x_25_pad_type_0 = const()[name = tensor("x_25_pad_type_0"), val = tensor("valid")]; tensor x_25_strides_0 = const()[name = tensor("x_25_strides_0"), val = tensor([1])]; tensor x_25_pad_0 = const()[name = tensor("x_25_pad_0"), val = tensor([0, 0])]; tensor x_25_dilations_0 = const()[name = tensor("x_25_dilations_0"), val = tensor([1])]; tensor x_25_groups_0 = const()[name = tensor("x_25_groups_0"), val = tensor(1)]; tensor encoder_layers_0_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19467456))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20516096))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_25_cast_fp16 = conv(dilations = x_25_dilations_0, groups = x_25_groups_0, pad = x_25_pad_0, pad_type = x_25_pad_type_0, strides = x_25_strides_0, weight = encoder_layers_0_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_59_cast_fp16)[name = tensor("x_25_cast_fp16")]; tensor input_61_perm_0 = const()[name = tensor("input_61_perm_0"), val = tensor([0, 2, 1])]; tensor input_61_cast_fp16 = transpose(perm = input_61_perm_0, x = x_25_cast_fp16)[name = tensor("transpose_354")]; tensor input_63_cast_fp16 = add(x = input_47_cast_fp16, y = input_61_cast_fp16)[name = tensor("input_63_cast_fp16")]; tensor input_65_axes_0 = const()[name = tensor("input_65_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_0_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20518208)))]; tensor encoder_layers_0_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_0_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20520320)))]; tensor input_65_cast_fp16 = layer_norm(axes = input_65_axes_0, beta = encoder_layers_0_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_0_norm_feed_forward2_weight_to_fp16, x = input_63_cast_fp16)[name = tensor("input_65_cast_fp16")]; tensor encoder_layers_0_feed_forward2_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_feed_forward2_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20522432))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24716800))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_0_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_0_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24725056)))]; tensor linear_8_cast_fp16 = linear(bias = encoder_layers_0_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_0_feed_forward2_linear1_weight_to_fp16_quantized, x = input_65_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor input_69_cast_fp16 = silu(x = linear_8_cast_fp16)[name = tensor("input_69_cast_fp16")]; tensor encoder_layers_0_feed_forward2_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_0_feed_forward2_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24733312))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28927680))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_0_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_0_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28929792)))]; tensor linear_9_cast_fp16 = linear(bias = encoder_layers_0_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_0_feed_forward2_linear2_weight_to_fp16_quantized, x = input_69_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor var_631_to_fp16 = const()[name = tensor("op_631_to_fp16"), val = tensor(0x1p-1)]; tensor var_632_cast_fp16 = mul(x = linear_9_cast_fp16, y = var_631_to_fp16)[name = tensor("op_632_cast_fp16")]; tensor input_75_cast_fp16 = add(x = input_63_cast_fp16, y = var_632_cast_fp16)[name = tensor("input_75_cast_fp16")]; tensor input_77_axes_0 = const()[name = tensor("input_77_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_0_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28931904)))]; tensor encoder_layers_0_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_0_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28934016)))]; tensor input_77_cast_fp16 = layer_norm(axes = input_77_axes_0, beta = encoder_layers_0_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_0_norm_out_weight_to_fp16, x = input_75_cast_fp16)[name = tensor("input_77_cast_fp16")]; tensor cache_5_begin_0 = const()[name = tensor("cache_5_begin_0"), val = tensor([1, 0, 0, 0])]; tensor cache_5_end_0 = const()[name = tensor("cache_5_end_0"), val = tensor([2, 1, 42, 1024])]; tensor cache_5_end_mask_0 = const()[name = tensor("cache_5_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_5_squeeze_mask_0 = const()[name = tensor("cache_5_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_5_cast_fp16 = slice_by_index(begin = cache_5_begin_0, end = cache_5_end_0, end_mask = cache_5_end_mask_0, squeeze_mask = cache_5_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_5_cast_fp16")]; tensor cache_7_begin_0 = const()[name = tensor("cache_7_begin_0"), val = tensor([1, 0, 0, 0])]; tensor cache_7_end_0 = const()[name = tensor("cache_7_end_0"), val = tensor([2, 1, 1024, 8])]; tensor cache_7_end_mask_0 = const()[name = tensor("cache_7_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_7_squeeze_mask_0 = const()[name = tensor("cache_7_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_7_cast_fp16 = slice_by_index(begin = cache_7_begin_0, end = cache_7_end_0, end_mask = cache_7_end_mask_0, squeeze_mask = cache_7_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_7_cast_fp16")]; tensor input_79_axes_0 = const()[name = tensor("input_79_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_1_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28936128)))]; tensor encoder_layers_1_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_1_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28938240)))]; tensor input_79_cast_fp16 = layer_norm(axes = input_79_axes_0, beta = encoder_layers_1_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_1_norm_feed_forward1_weight_to_fp16, x = input_77_cast_fp16)[name = tensor("input_79_cast_fp16")]; tensor encoder_layers_1_feed_forward1_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_feed_forward1_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28940352))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33134720))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_1_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_1_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33142976)))]; tensor linear_10_cast_fp16 = linear(bias = encoder_layers_1_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_1_feed_forward1_linear1_weight_to_fp16_quantized, x = input_79_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor input_83_cast_fp16 = silu(x = linear_10_cast_fp16)[name = tensor("input_83_cast_fp16")]; tensor encoder_layers_1_feed_forward1_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_feed_forward1_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33151232))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37345600))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_1_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_1_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37347712)))]; tensor linear_11_cast_fp16 = linear(bias = encoder_layers_1_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_1_feed_forward1_linear2_weight_to_fp16_quantized, x = input_83_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor var_668_to_fp16 = const()[name = tensor("op_668_to_fp16"), val = tensor(0x1p-1)]; tensor var_669_cast_fp16 = mul(x = linear_11_cast_fp16, y = var_668_to_fp16)[name = tensor("op_669_cast_fp16")]; tensor input_89_cast_fp16 = add(x = input_77_cast_fp16, y = var_669_cast_fp16)[name = tensor("input_89_cast_fp16")]; tensor key_3_axes_0 = const()[name = tensor("key_3_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_1_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37349824)))]; tensor encoder_layers_1_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_1_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37351936)))]; tensor key_3_cast_fp16 = layer_norm(axes = key_3_axes_0, beta = encoder_layers_1_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_1_norm_self_att_weight_to_fp16, x = input_89_cast_fp16)[name = tensor("key_3_cast_fp16")]; tensor input_91_interleave_0 = const()[name = tensor("input_91_interleave_0"), val = tensor(false)]; tensor input_91_cast_fp16 = concat(axis = var_68, interleave = input_91_interleave_0, values = (cache_5_cast_fp16, key_3_cast_fp16))[name = tensor("input_91_cast_fp16")]; tensor var_691_begin_0 = const()[name = tensor("op_691_begin_0"), val = tensor([0, 7, 0])]; tensor var_691_end_0 = const()[name = tensor("op_691_end_0"), val = tensor([1, 42, 1024])]; tensor var_691_end_mask_0 = const()[name = tensor("op_691_end_mask_0"), val = tensor([true, true, true])]; tensor var_691_cast_fp16 = slice_by_index(begin = var_691_begin_0, end = var_691_end_0, end_mask = var_691_end_mask_0, x = cache_5_cast_fp16)[name = tensor("op_691_cast_fp16")]; tensor var_697_interleave_0 = const()[name = tensor("op_697_interleave_0"), val = tensor(false)]; tensor var_697_cast_fp16 = concat(axis = var_68, interleave = var_697_interleave_0, values = (var_691_cast_fp16, key_3_cast_fp16))[name = tensor("op_697_cast_fp16")]; tensor encoder_layers_1_self_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_self_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37354048))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38402688))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_1_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38404800)))]; tensor linear_12_cast_fp16 = linear(bias = encoder_layers_1_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_1_self_attn_linear_q_weight_to_fp16_quantized, x = key_3_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor var_702 = const()[name = tensor("op_702"), val = tensor([1, -1, 8, 128])]; tensor q_7_cast_fp16 = reshape(shape = var_702, x = linear_12_cast_fp16)[name = tensor("q_7_cast_fp16")]; tensor encoder_layers_1_self_attn_linear_k_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_self_attn_linear_k_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38406912))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39455552))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_1_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39457664)))]; tensor linear_13_cast_fp16 = linear(bias = encoder_layers_1_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_1_self_attn_linear_k_weight_to_fp16_quantized, x = input_91_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor var_707 = const()[name = tensor("op_707"), val = tensor([1, -1, 8, 128])]; tensor k_5_cast_fp16 = reshape(shape = var_707, x = linear_13_cast_fp16)[name = tensor("k_5_cast_fp16")]; tensor encoder_layers_1_self_attn_linear_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_self_attn_linear_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39459776))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40508416))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_1_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40510528)))]; tensor linear_14_cast_fp16 = linear(bias = encoder_layers_1_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_1_self_attn_linear_v_weight_to_fp16_quantized, x = input_91_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor var_712 = const()[name = tensor("op_712"), val = tensor([1, -1, 8, 128])]; tensor v_3_cast_fp16 = reshape(shape = var_712, x = linear_14_cast_fp16)[name = tensor("v_3_cast_fp16")]; tensor value_11_perm_0 = const()[name = tensor("value_11_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_1_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40512640)))]; tensor var_725_cast_fp16 = add(x = q_7_cast_fp16, y = encoder_layers_1_self_attn_pos_bias_u_to_fp16)[name = tensor("op_725_cast_fp16")]; tensor encoder_layers_1_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40514752)))]; tensor var_727_cast_fp16 = add(x = q_7_cast_fp16, y = encoder_layers_1_self_attn_pos_bias_v_to_fp16)[name = tensor("op_727_cast_fp16")]; tensor q_with_bias_v_3_perm_0 = const()[name = tensor("q_with_bias_v_3_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_33_transpose_x_0 = const()[name = tensor("x_33_transpose_x_0"), val = tensor(false)]; tensor x_33_transpose_y_0 = const()[name = tensor("x_33_transpose_y_0"), val = tensor(false)]; tensor op_729_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_729_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40516864))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40616448))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40616256)))]; tensor q_with_bias_v_3_cast_fp16 = transpose(perm = q_with_bias_v_3_perm_0, x = var_727_cast_fp16)[name = tensor("transpose_353")]; tensor x_33_cast_fp16 = matmul(transpose_x = x_33_transpose_x_0, transpose_y = x_33_transpose_y_0, x = q_with_bias_v_3_cast_fp16, y = op_729_to_fp16_quantized)[name = tensor("x_33_cast_fp16")]; tensor x_35_pad_0 = const()[name = tensor("x_35_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_35_mode_0 = const()[name = tensor("x_35_mode_0"), val = tensor("constant")]; tensor const_92_to_fp16 = const()[name = tensor("const_92_to_fp16"), val = tensor(0x0p+0)]; tensor x_35_cast_fp16 = pad(constant_val = const_92_to_fp16, mode = x_35_mode_0, pad = x_35_pad_0, x = x_33_cast_fp16)[name = tensor("x_35_cast_fp16")]; tensor var_737 = const()[name = tensor("op_737"), val = tensor([1, 8, -1, 7])]; tensor x_37_cast_fp16 = reshape(shape = var_737, x = x_35_cast_fp16)[name = tensor("x_37_cast_fp16")]; tensor var_741_begin_0 = const()[name = tensor("op_741_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_741_end_0 = const()[name = tensor("op_741_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_741_end_mask_0 = const()[name = tensor("op_741_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_741_cast_fp16 = slice_by_index(begin = var_741_begin_0, end = var_741_end_0, end_mask = var_741_end_mask_0, x = x_37_cast_fp16)[name = tensor("op_741_cast_fp16")]; tensor var_742 = const()[name = tensor("op_742"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_5_cast_fp16 = reshape(shape = var_742, x = var_741_cast_fp16)[name = tensor("matrix_bd_5_cast_fp16")]; tensor matrix_ac_3_transpose_x_0 = const()[name = tensor("matrix_ac_3_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_3_transpose_y_0 = const()[name = tensor("matrix_ac_3_transpose_y_0"), val = tensor(false)]; tensor transpose_98_perm_0 = const()[name = tensor("transpose_98_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_99_perm_0 = const()[name = tensor("transpose_99_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_99 = transpose(perm = transpose_99_perm_0, x = k_5_cast_fp16)[name = tensor("transpose_351")]; tensor transpose_98 = transpose(perm = transpose_98_perm_0, x = var_725_cast_fp16)[name = tensor("transpose_352")]; tensor matrix_ac_3_cast_fp16 = matmul(transpose_x = matrix_ac_3_transpose_x_0, transpose_y = matrix_ac_3_transpose_y_0, x = transpose_98, y = transpose_99)[name = tensor("matrix_ac_3_cast_fp16")]; tensor matrix_bd_7_begin_0 = const()[name = tensor("matrix_bd_7_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_7_end_0 = const()[name = tensor("matrix_bd_7_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_7_end_mask_0 = const()[name = tensor("matrix_bd_7_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_7_cast_fp16 = slice_by_index(begin = matrix_bd_7_begin_0, end = matrix_bd_7_end_0, end_mask = matrix_bd_7_end_mask_0, x = matrix_bd_5_cast_fp16)[name = tensor("matrix_bd_7_cast_fp16")]; tensor var_751_cast_fp16 = add(x = matrix_ac_3_cast_fp16, y = matrix_bd_7_cast_fp16)[name = tensor("op_751_cast_fp16")]; tensor _inversed_scores_5_y_0_to_fp16 = const()[name = tensor("_inversed_scores_5_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_5_cast_fp16 = mul(x = var_751_cast_fp16, y = _inversed_scores_5_y_0_to_fp16)[name = tensor("_inversed_scores_5_cast_fp16")]; tensor scores_7_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_5_cast_fp16, cond = mask_11)[name = tensor("scores_7_cast_fp16")]; tensor var_757_cast_fp16 = softmax(axis = var_59, x = scores_7_cast_fp16)[name = tensor("op_757_cast_fp16")]; tensor input_93_cast_fp16 = select(a = var_44_to_fp16, b = var_757_cast_fp16, cond = mask_11)[name = tensor("input_93_cast_fp16")]; tensor x_39_transpose_x_0 = const()[name = tensor("x_39_transpose_x_0"), val = tensor(false)]; tensor x_39_transpose_y_0 = const()[name = tensor("x_39_transpose_y_0"), val = tensor(false)]; tensor value_11_cast_fp16 = transpose(perm = value_11_perm_0, x = v_3_cast_fp16)[name = tensor("transpose_350")]; tensor x_39_cast_fp16 = matmul(transpose_x = x_39_transpose_x_0, transpose_y = x_39_transpose_y_0, x = input_93_cast_fp16, y = value_11_cast_fp16)[name = tensor("x_39_cast_fp16")]; tensor var_761_perm_0 = const()[name = tensor("op_761_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_762 = const()[name = tensor("op_762"), val = tensor([1, -1, 1024])]; tensor var_761_cast_fp16 = transpose(perm = var_761_perm_0, x = x_39_cast_fp16)[name = tensor("transpose_349")]; tensor input_95_cast_fp16 = reshape(shape = var_762, x = var_761_cast_fp16)[name = tensor("input_95_cast_fp16")]; tensor encoder_layers_1_self_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_self_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40616768))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41665408))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_1_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41667520)))]; tensor linear_16_cast_fp16 = linear(bias = encoder_layers_1_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_1_self_attn_linear_out_weight_to_fp16_quantized, x = input_95_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor input_99_cast_fp16 = add(x = input_89_cast_fp16, y = linear_16_cast_fp16)[name = tensor("input_99_cast_fp16")]; tensor x_43_axes_0 = const()[name = tensor("x_43_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_1_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41669632)))]; tensor encoder_layers_1_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_1_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41671744)))]; tensor x_43_cast_fp16 = layer_norm(axes = x_43_axes_0, beta = encoder_layers_1_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_1_norm_conv_weight_to_fp16, x = input_99_cast_fp16)[name = tensor("x_43_cast_fp16")]; tensor input_101_perm_0 = const()[name = tensor("input_101_perm_0"), val = tensor([0, 2, 1])]; tensor input_103_pad_type_0 = const()[name = tensor("input_103_pad_type_0"), val = tensor("valid")]; tensor input_103_strides_0 = const()[name = tensor("input_103_strides_0"), val = tensor([1])]; tensor input_103_pad_0 = const()[name = tensor("input_103_pad_0"), val = tensor([0, 0])]; tensor input_103_dilations_0 = const()[name = tensor("input_103_dilations_0"), val = tensor([1])]; tensor input_103_groups_0 = const()[name = tensor("input_103_groups_0"), val = tensor(1)]; tensor encoder_layers_1_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41673856))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43771072))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_101_cast_fp16 = transpose(perm = input_101_perm_0, x = x_43_cast_fp16)[name = tensor("transpose_348")]; tensor input_103_cast_fp16 = conv(dilations = input_103_dilations_0, groups = input_103_groups_0, pad = input_103_pad_0, pad_type = input_103_pad_type_0, strides = input_103_strides_0, weight = encoder_layers_1_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_101_cast_fp16)[name = tensor("input_103_cast_fp16")]; tensor x_45_split_num_splits_0 = const()[name = tensor("x_45_split_num_splits_0"), val = tensor(2)]; tensor x_45_split_axis_0 = const()[name = tensor("x_45_split_axis_0"), val = tensor(1)]; tensor x_45_split_cast_fp16_0, tensor x_45_split_cast_fp16_1 = split(axis = x_45_split_axis_0, num_splits = x_45_split_num_splits_0, x = input_103_cast_fp16)[name = tensor("x_45_split_cast_fp16")]; tensor x_45_split_1_sigmoid_cast_fp16 = sigmoid(x = x_45_split_cast_fp16_1)[name = tensor("x_45_split_1_sigmoid_cast_fp16")]; tensor x_45_cast_fp16 = mul(x = x_45_split_cast_fp16_0, y = x_45_split_1_sigmoid_cast_fp16)[name = tensor("x_45_cast_fp16")]; tensor input_105_cast_fp16 = select(a = var_44_to_fp16, b = x_45_cast_fp16, cond = var_575)[name = tensor("input_105_cast_fp16")]; tensor new_x_7_interleave_0 = const()[name = tensor("new_x_7_interleave_0"), val = tensor(false)]; tensor new_x_7_cast_fp16 = concat(axis = var_59, interleave = new_x_7_interleave_0, values = (cache_7_cast_fp16, input_105_cast_fp16))[name = tensor("new_x_7_cast_fp16")]; tensor var_801_begin_0 = const()[name = tensor("op_801_begin_0"), val = tensor([0, 0, 7])]; tensor var_801_end_0 = const()[name = tensor("op_801_end_0"), val = tensor([1, 1024, 15])]; tensor var_801_end_mask_0 = const()[name = tensor("op_801_end_mask_0"), val = tensor([true, true, true])]; tensor var_801_cast_fp16 = slice_by_index(begin = var_801_begin_0, end = var_801_end_0, end_mask = var_801_end_mask_0, x = new_x_7_cast_fp16)[name = tensor("op_801_cast_fp16")]; tensor x_47_pad_type_0 = const()[name = tensor("x_47_pad_type_0"), val = tensor("valid")]; tensor x_47_groups_0 = const()[name = tensor("x_47_groups_0"), val = tensor(1024)]; tensor x_47_strides_0 = const()[name = tensor("x_47_strides_0"), val = tensor([1])]; tensor x_47_pad_0 = const()[name = tensor("x_47_pad_0"), val = tensor([0, 0])]; tensor x_47_dilations_0 = const()[name = tensor("x_47_dilations_0"), val = tensor([1])]; tensor encoder_layers_1_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43775232))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43784512))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_47_cast_fp16 = conv(dilations = x_47_dilations_0, groups = x_47_groups_0, pad = x_47_pad_0, pad_type = x_47_pad_type_0, strides = x_47_strides_0, weight = encoder_layers_1_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_7_cast_fp16)[name = tensor("x_47_cast_fp16")]; tensor input_107_perm_0 = const()[name = tensor("input_107_perm_0"), val = tensor([0, 2, 1])]; tensor x_49_axes_0 = const()[name = tensor("x_49_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_1_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43786624)))]; tensor encoder_layers_1_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_1_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43788736)))]; tensor input_107_cast_fp16 = transpose(perm = input_107_perm_0, x = x_47_cast_fp16)[name = tensor("transpose_347")]; tensor x_49_cast_fp16 = layer_norm(axes = x_49_axes_0, beta = encoder_layers_1_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_1_conv_batch_norm_weight_to_fp16, x = input_107_cast_fp16)[name = tensor("x_49_cast_fp16")]; tensor input_109_perm_0 = const()[name = tensor("input_109_perm_0"), val = tensor([0, 2, 1])]; tensor input_109_cast_fp16 = transpose(perm = input_109_perm_0, x = x_49_cast_fp16)[name = tensor("transpose_346")]; tensor input_111_cast_fp16 = silu(x = input_109_cast_fp16)[name = tensor("input_111_cast_fp16")]; tensor x_51_pad_type_0 = const()[name = tensor("x_51_pad_type_0"), val = tensor("valid")]; tensor x_51_strides_0 = const()[name = tensor("x_51_strides_0"), val = tensor([1])]; tensor x_51_pad_0 = const()[name = tensor("x_51_pad_0"), val = tensor([0, 0])]; tensor x_51_dilations_0 = const()[name = tensor("x_51_dilations_0"), val = tensor([1])]; tensor x_51_groups_0 = const()[name = tensor("x_51_groups_0"), val = tensor(1)]; tensor encoder_layers_1_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43790848))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44839488))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_51_cast_fp16 = conv(dilations = x_51_dilations_0, groups = x_51_groups_0, pad = x_51_pad_0, pad_type = x_51_pad_type_0, strides = x_51_strides_0, weight = encoder_layers_1_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_111_cast_fp16)[name = tensor("x_51_cast_fp16")]; tensor input_113_perm_0 = const()[name = tensor("input_113_perm_0"), val = tensor([0, 2, 1])]; tensor input_113_cast_fp16 = transpose(perm = input_113_perm_0, x = x_51_cast_fp16)[name = tensor("transpose_345")]; tensor input_115_cast_fp16 = add(x = input_99_cast_fp16, y = input_113_cast_fp16)[name = tensor("input_115_cast_fp16")]; tensor input_117_axes_0 = const()[name = tensor("input_117_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_1_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44841600)))]; tensor encoder_layers_1_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_1_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44843712)))]; tensor input_117_cast_fp16 = layer_norm(axes = input_117_axes_0, beta = encoder_layers_1_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_1_norm_feed_forward2_weight_to_fp16, x = input_115_cast_fp16)[name = tensor("input_117_cast_fp16")]; tensor encoder_layers_1_feed_forward2_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_feed_forward2_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44845824))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49040192))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_1_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_1_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49048448)))]; tensor linear_17_cast_fp16 = linear(bias = encoder_layers_1_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_1_feed_forward2_linear1_weight_to_fp16_quantized, x = input_117_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor input_121_cast_fp16 = silu(x = linear_17_cast_fp16)[name = tensor("input_121_cast_fp16")]; tensor encoder_layers_1_feed_forward2_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_1_feed_forward2_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49056704))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53251072))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_1_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_1_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53253184)))]; tensor linear_18_cast_fp16 = linear(bias = encoder_layers_1_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_1_feed_forward2_linear2_weight_to_fp16_quantized, x = input_121_cast_fp16)[name = tensor("linear_18_cast_fp16")]; tensor var_844_to_fp16 = const()[name = tensor("op_844_to_fp16"), val = tensor(0x1p-1)]; tensor var_845_cast_fp16 = mul(x = linear_18_cast_fp16, y = var_844_to_fp16)[name = tensor("op_845_cast_fp16")]; tensor input_127_cast_fp16 = add(x = input_115_cast_fp16, y = var_845_cast_fp16)[name = tensor("input_127_cast_fp16")]; tensor input_129_axes_0 = const()[name = tensor("input_129_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_1_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53255296)))]; tensor encoder_layers_1_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_1_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53257408)))]; tensor input_129_cast_fp16 = layer_norm(axes = input_129_axes_0, beta = encoder_layers_1_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_1_norm_out_weight_to_fp16, x = input_127_cast_fp16)[name = tensor("input_129_cast_fp16")]; tensor cache_9_begin_0 = const()[name = tensor("cache_9_begin_0"), val = tensor([2, 0, 0, 0])]; tensor cache_9_end_0 = const()[name = tensor("cache_9_end_0"), val = tensor([3, 1, 42, 1024])]; tensor cache_9_end_mask_0 = const()[name = tensor("cache_9_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_9_squeeze_mask_0 = const()[name = tensor("cache_9_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_9_cast_fp16 = slice_by_index(begin = cache_9_begin_0, end = cache_9_end_0, end_mask = cache_9_end_mask_0, squeeze_mask = cache_9_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_9_cast_fp16")]; tensor cache_11_begin_0 = const()[name = tensor("cache_11_begin_0"), val = tensor([2, 0, 0, 0])]; tensor cache_11_end_0 = const()[name = tensor("cache_11_end_0"), val = tensor([3, 1, 1024, 8])]; tensor cache_11_end_mask_0 = const()[name = tensor("cache_11_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_11_squeeze_mask_0 = const()[name = tensor("cache_11_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_11_cast_fp16 = slice_by_index(begin = cache_11_begin_0, end = cache_11_end_0, end_mask = cache_11_end_mask_0, squeeze_mask = cache_11_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_11_cast_fp16")]; tensor input_131_axes_0 = const()[name = tensor("input_131_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_2_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53259520)))]; tensor encoder_layers_2_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_2_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53261632)))]; tensor input_131_cast_fp16 = layer_norm(axes = input_131_axes_0, beta = encoder_layers_2_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_2_norm_feed_forward1_weight_to_fp16, x = input_129_cast_fp16)[name = tensor("input_131_cast_fp16")]; tensor encoder_layers_2_feed_forward1_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_2_feed_forward1_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53263744))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57458112))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_2_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_2_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57466368)))]; tensor linear_19_cast_fp16 = linear(bias = encoder_layers_2_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_2_feed_forward1_linear1_weight_to_fp16_quantized, x = input_131_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor input_135_cast_fp16 = silu(x = linear_19_cast_fp16)[name = tensor("input_135_cast_fp16")]; tensor encoder_layers_2_feed_forward1_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_2_feed_forward1_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57474624))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61668992))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_2_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_2_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61671104)))]; tensor linear_20_cast_fp16 = linear(bias = encoder_layers_2_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_2_feed_forward1_linear2_weight_to_fp16_quantized, x = input_135_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor var_881_to_fp16 = const()[name = tensor("op_881_to_fp16"), val = tensor(0x1p-1)]; tensor var_882_cast_fp16 = mul(x = linear_20_cast_fp16, y = var_881_to_fp16)[name = tensor("op_882_cast_fp16")]; tensor input_141_cast_fp16 = add(x = input_129_cast_fp16, y = var_882_cast_fp16)[name = tensor("input_141_cast_fp16")]; tensor key_5_axes_0 = const()[name = tensor("key_5_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_2_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61673216)))]; tensor encoder_layers_2_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_2_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61675328)))]; tensor key_5_cast_fp16 = layer_norm(axes = key_5_axes_0, beta = encoder_layers_2_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_2_norm_self_att_weight_to_fp16, x = input_141_cast_fp16)[name = tensor("key_5_cast_fp16")]; tensor input_143_interleave_0 = const()[name = tensor("input_143_interleave_0"), val = tensor(false)]; tensor input_143_cast_fp16 = concat(axis = var_68, interleave = input_143_interleave_0, values = (cache_9_cast_fp16, key_5_cast_fp16))[name = tensor("input_143_cast_fp16")]; tensor var_904_begin_0 = const()[name = tensor("op_904_begin_0"), val = tensor([0, 7, 0])]; tensor var_904_end_0 = const()[name = tensor("op_904_end_0"), val = tensor([1, 42, 1024])]; tensor var_904_end_mask_0 = const()[name = tensor("op_904_end_mask_0"), val = tensor([true, true, true])]; tensor var_904_cast_fp16 = slice_by_index(begin = var_904_begin_0, end = var_904_end_0, end_mask = var_904_end_mask_0, x = cache_9_cast_fp16)[name = tensor("op_904_cast_fp16")]; tensor var_910_interleave_0 = const()[name = tensor("op_910_interleave_0"), val = tensor(false)]; tensor var_910_cast_fp16 = concat(axis = var_68, interleave = var_910_interleave_0, values = (var_904_cast_fp16, key_5_cast_fp16))[name = tensor("op_910_cast_fp16")]; tensor encoder_layers_2_self_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_2_self_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61677440))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(62726080))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_2_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(62728192)))]; tensor linear_21_cast_fp16 = linear(bias = encoder_layers_2_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_2_self_attn_linear_q_weight_to_fp16_quantized, x = key_5_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor var_915 = const()[name = tensor("op_915"), val = tensor([1, -1, 8, 128])]; tensor q_13_cast_fp16 = reshape(shape = var_915, x = linear_21_cast_fp16)[name = tensor("q_13_cast_fp16")]; tensor encoder_layers_2_self_attn_linear_k_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_2_self_attn_linear_k_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(62730304))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(63778944))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_2_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(63781056)))]; tensor linear_22_cast_fp16 = linear(bias = encoder_layers_2_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_2_self_attn_linear_k_weight_to_fp16_quantized, x = input_143_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor var_920 = const()[name = tensor("op_920"), val = tensor([1, -1, 8, 128])]; tensor k_9_cast_fp16 = reshape(shape = var_920, x = linear_22_cast_fp16)[name = tensor("k_9_cast_fp16")]; tensor encoder_layers_2_self_attn_linear_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_2_self_attn_linear_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(63783168))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64831808))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_2_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64833920)))]; tensor linear_23_cast_fp16 = linear(bias = encoder_layers_2_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_2_self_attn_linear_v_weight_to_fp16_quantized, x = input_143_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor var_925 = const()[name = tensor("op_925"), val = tensor([1, -1, 8, 128])]; tensor v_5_cast_fp16 = reshape(shape = var_925, x = linear_23_cast_fp16)[name = tensor("v_5_cast_fp16")]; tensor value_13_perm_0 = const()[name = tensor("value_13_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_2_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64836032)))]; tensor var_938_cast_fp16 = add(x = q_13_cast_fp16, y = encoder_layers_2_self_attn_pos_bias_u_to_fp16)[name = tensor("op_938_cast_fp16")]; tensor encoder_layers_2_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64838144)))]; tensor var_940_cast_fp16 = add(x = q_13_cast_fp16, y = encoder_layers_2_self_attn_pos_bias_v_to_fp16)[name = tensor("op_940_cast_fp16")]; tensor q_with_bias_v_5_perm_0 = const()[name = tensor("q_with_bias_v_5_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_59_transpose_x_0 = const()[name = tensor("x_59_transpose_x_0"), val = tensor(false)]; tensor x_59_transpose_y_0 = const()[name = tensor("x_59_transpose_y_0"), val = tensor(false)]; tensor op_942_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_942_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64840256))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64939840))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64939648)))]; tensor q_with_bias_v_5_cast_fp16 = transpose(perm = q_with_bias_v_5_perm_0, x = var_940_cast_fp16)[name = tensor("transpose_344")]; tensor x_59_cast_fp16 = matmul(transpose_x = x_59_transpose_x_0, transpose_y = x_59_transpose_y_0, x = q_with_bias_v_5_cast_fp16, y = op_942_to_fp16_quantized)[name = tensor("x_59_cast_fp16")]; tensor x_61_pad_0 = const()[name = tensor("x_61_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_61_mode_0 = const()[name = tensor("x_61_mode_0"), val = tensor("constant")]; tensor const_105_to_fp16 = const()[name = tensor("const_105_to_fp16"), val = tensor(0x0p+0)]; tensor x_61_cast_fp16 = pad(constant_val = const_105_to_fp16, mode = x_61_mode_0, pad = x_61_pad_0, x = x_59_cast_fp16)[name = tensor("x_61_cast_fp16")]; tensor var_950 = const()[name = tensor("op_950"), val = tensor([1, 8, -1, 7])]; tensor x_63_cast_fp16 = reshape(shape = var_950, x = x_61_cast_fp16)[name = tensor("x_63_cast_fp16")]; tensor var_954_begin_0 = const()[name = tensor("op_954_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_954_end_0 = const()[name = tensor("op_954_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_954_end_mask_0 = const()[name = tensor("op_954_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_954_cast_fp16 = slice_by_index(begin = var_954_begin_0, end = var_954_end_0, end_mask = var_954_end_mask_0, x = x_63_cast_fp16)[name = tensor("op_954_cast_fp16")]; tensor var_955 = const()[name = tensor("op_955"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_9_cast_fp16 = reshape(shape = var_955, x = var_954_cast_fp16)[name = tensor("matrix_bd_9_cast_fp16")]; tensor matrix_ac_5_transpose_x_0 = const()[name = tensor("matrix_ac_5_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_5_transpose_y_0 = const()[name = tensor("matrix_ac_5_transpose_y_0"), val = tensor(false)]; tensor transpose_100_perm_0 = const()[name = tensor("transpose_100_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_101_perm_0 = const()[name = tensor("transpose_101_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_101 = transpose(perm = transpose_101_perm_0, x = k_9_cast_fp16)[name = tensor("transpose_342")]; tensor transpose_100 = transpose(perm = transpose_100_perm_0, x = var_938_cast_fp16)[name = tensor("transpose_343")]; tensor matrix_ac_5_cast_fp16 = matmul(transpose_x = matrix_ac_5_transpose_x_0, transpose_y = matrix_ac_5_transpose_y_0, x = transpose_100, y = transpose_101)[name = tensor("matrix_ac_5_cast_fp16")]; tensor matrix_bd_11_begin_0 = const()[name = tensor("matrix_bd_11_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_11_end_0 = const()[name = tensor("matrix_bd_11_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_11_end_mask_0 = const()[name = tensor("matrix_bd_11_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_11_cast_fp16 = slice_by_index(begin = matrix_bd_11_begin_0, end = matrix_bd_11_end_0, end_mask = matrix_bd_11_end_mask_0, x = matrix_bd_9_cast_fp16)[name = tensor("matrix_bd_11_cast_fp16")]; tensor var_964_cast_fp16 = add(x = matrix_ac_5_cast_fp16, y = matrix_bd_11_cast_fp16)[name = tensor("op_964_cast_fp16")]; tensor _inversed_scores_9_y_0_to_fp16 = const()[name = tensor("_inversed_scores_9_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_9_cast_fp16 = mul(x = var_964_cast_fp16, y = _inversed_scores_9_y_0_to_fp16)[name = tensor("_inversed_scores_9_cast_fp16")]; tensor scores_11_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_9_cast_fp16, cond = mask_11)[name = tensor("scores_11_cast_fp16")]; tensor var_970_cast_fp16 = softmax(axis = var_59, x = scores_11_cast_fp16)[name = tensor("op_970_cast_fp16")]; tensor input_145_cast_fp16 = select(a = var_44_to_fp16, b = var_970_cast_fp16, cond = mask_11)[name = tensor("input_145_cast_fp16")]; tensor x_65_transpose_x_0 = const()[name = tensor("x_65_transpose_x_0"), val = tensor(false)]; tensor x_65_transpose_y_0 = const()[name = tensor("x_65_transpose_y_0"), val = tensor(false)]; tensor value_13_cast_fp16 = transpose(perm = value_13_perm_0, x = v_5_cast_fp16)[name = tensor("transpose_341")]; tensor x_65_cast_fp16 = matmul(transpose_x = x_65_transpose_x_0, transpose_y = x_65_transpose_y_0, x = input_145_cast_fp16, y = value_13_cast_fp16)[name = tensor("x_65_cast_fp16")]; tensor var_974_perm_0 = const()[name = tensor("op_974_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_975 = const()[name = tensor("op_975"), val = tensor([1, -1, 1024])]; tensor var_974_cast_fp16 = transpose(perm = var_974_perm_0, x = x_65_cast_fp16)[name = tensor("transpose_340")]; tensor input_147_cast_fp16 = reshape(shape = var_975, x = var_974_cast_fp16)[name = tensor("input_147_cast_fp16")]; tensor encoder_layers_2_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64940160))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65726656))), name = tensor("encoder_layers_2_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_2_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65726848)))]; tensor linear_25_cast_fp16 = linear(bias = encoder_layers_2_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_2_self_attn_linear_out_weight_to_fp16_palettized, x = input_147_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor input_151_cast_fp16 = add(x = input_141_cast_fp16, y = linear_25_cast_fp16)[name = tensor("input_151_cast_fp16")]; tensor x_69_axes_0 = const()[name = tensor("x_69_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_2_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65728960)))]; tensor encoder_layers_2_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_2_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65731072)))]; tensor x_69_cast_fp16 = layer_norm(axes = x_69_axes_0, beta = encoder_layers_2_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_2_norm_conv_weight_to_fp16, x = input_151_cast_fp16)[name = tensor("x_69_cast_fp16")]; tensor input_153_perm_0 = const()[name = tensor("input_153_perm_0"), val = tensor([0, 2, 1])]; tensor input_155_pad_type_0 = const()[name = tensor("input_155_pad_type_0"), val = tensor("valid")]; tensor input_155_strides_0 = const()[name = tensor("input_155_strides_0"), val = tensor([1])]; tensor input_155_pad_0 = const()[name = tensor("input_155_pad_0"), val = tensor([0, 0])]; tensor input_155_dilations_0 = const()[name = tensor("input_155_dilations_0"), val = tensor([1])]; tensor input_155_groups_0 = const()[name = tensor("input_155_groups_0"), val = tensor(1)]; tensor encoder_layers_2_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_2_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65733184))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67830400))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_153_cast_fp16 = transpose(perm = input_153_perm_0, x = x_69_cast_fp16)[name = tensor("transpose_339")]; tensor input_155_cast_fp16 = conv(dilations = input_155_dilations_0, groups = input_155_groups_0, pad = input_155_pad_0, pad_type = input_155_pad_type_0, strides = input_155_strides_0, weight = encoder_layers_2_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_153_cast_fp16)[name = tensor("input_155_cast_fp16")]; tensor x_71_split_num_splits_0 = const()[name = tensor("x_71_split_num_splits_0"), val = tensor(2)]; tensor x_71_split_axis_0 = const()[name = tensor("x_71_split_axis_0"), val = tensor(1)]; tensor x_71_split_cast_fp16_0, tensor x_71_split_cast_fp16_1 = split(axis = x_71_split_axis_0, num_splits = x_71_split_num_splits_0, x = input_155_cast_fp16)[name = tensor("x_71_split_cast_fp16")]; tensor x_71_split_1_sigmoid_cast_fp16 = sigmoid(x = x_71_split_cast_fp16_1)[name = tensor("x_71_split_1_sigmoid_cast_fp16")]; tensor x_71_cast_fp16 = mul(x = x_71_split_cast_fp16_0, y = x_71_split_1_sigmoid_cast_fp16)[name = tensor("x_71_cast_fp16")]; tensor input_157_cast_fp16 = select(a = var_44_to_fp16, b = x_71_cast_fp16, cond = var_575)[name = tensor("input_157_cast_fp16")]; tensor new_x_11_interleave_0 = const()[name = tensor("new_x_11_interleave_0"), val = tensor(false)]; tensor new_x_11_cast_fp16 = concat(axis = var_59, interleave = new_x_11_interleave_0, values = (cache_11_cast_fp16, input_157_cast_fp16))[name = tensor("new_x_11_cast_fp16")]; tensor var_1014_begin_0 = const()[name = tensor("op_1014_begin_0"), val = tensor([0, 0, 7])]; tensor var_1014_end_0 = const()[name = tensor("op_1014_end_0"), val = tensor([1, 1024, 15])]; tensor var_1014_end_mask_0 = const()[name = tensor("op_1014_end_mask_0"), val = tensor([true, true, true])]; tensor var_1014_cast_fp16 = slice_by_index(begin = var_1014_begin_0, end = var_1014_end_0, end_mask = var_1014_end_mask_0, x = new_x_11_cast_fp16)[name = tensor("op_1014_cast_fp16")]; tensor x_73_pad_type_0 = const()[name = tensor("x_73_pad_type_0"), val = tensor("valid")]; tensor x_73_groups_0 = const()[name = tensor("x_73_groups_0"), val = tensor(1024)]; tensor x_73_strides_0 = const()[name = tensor("x_73_strides_0"), val = tensor([1])]; tensor x_73_pad_0 = const()[name = tensor("x_73_pad_0"), val = tensor([0, 0])]; tensor x_73_dilations_0 = const()[name = tensor("x_73_dilations_0"), val = tensor([1])]; tensor encoder_layers_2_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_2_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67834560))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67843840))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_73_cast_fp16 = conv(dilations = x_73_dilations_0, groups = x_73_groups_0, pad = x_73_pad_0, pad_type = x_73_pad_type_0, strides = x_73_strides_0, weight = encoder_layers_2_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_11_cast_fp16)[name = tensor("x_73_cast_fp16")]; tensor input_159_perm_0 = const()[name = tensor("input_159_perm_0"), val = tensor([0, 2, 1])]; tensor x_75_axes_0 = const()[name = tensor("x_75_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_2_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67845952)))]; tensor encoder_layers_2_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_2_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67848064)))]; tensor input_159_cast_fp16 = transpose(perm = input_159_perm_0, x = x_73_cast_fp16)[name = tensor("transpose_338")]; tensor x_75_cast_fp16 = layer_norm(axes = x_75_axes_0, beta = encoder_layers_2_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_2_conv_batch_norm_weight_to_fp16, x = input_159_cast_fp16)[name = tensor("x_75_cast_fp16")]; tensor input_161_perm_0 = const()[name = tensor("input_161_perm_0"), val = tensor([0, 2, 1])]; tensor input_161_cast_fp16 = transpose(perm = input_161_perm_0, x = x_75_cast_fp16)[name = tensor("transpose_337")]; tensor input_163_cast_fp16 = silu(x = input_161_cast_fp16)[name = tensor("input_163_cast_fp16")]; tensor x_77_pad_type_0 = const()[name = tensor("x_77_pad_type_0"), val = tensor("valid")]; tensor x_77_strides_0 = const()[name = tensor("x_77_strides_0"), val = tensor([1])]; tensor x_77_pad_0 = const()[name = tensor("x_77_pad_0"), val = tensor([0, 0])]; tensor x_77_dilations_0 = const()[name = tensor("x_77_dilations_0"), val = tensor([1])]; tensor x_77_groups_0 = const()[name = tensor("x_77_groups_0"), val = tensor(1)]; tensor encoder_layers_2_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_2_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67850176))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68898816))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_77_cast_fp16 = conv(dilations = x_77_dilations_0, groups = x_77_groups_0, pad = x_77_pad_0, pad_type = x_77_pad_type_0, strides = x_77_strides_0, weight = encoder_layers_2_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_163_cast_fp16)[name = tensor("x_77_cast_fp16")]; tensor input_165_perm_0 = const()[name = tensor("input_165_perm_0"), val = tensor([0, 2, 1])]; tensor input_165_cast_fp16 = transpose(perm = input_165_perm_0, x = x_77_cast_fp16)[name = tensor("transpose_336")]; tensor input_167_cast_fp16 = add(x = input_151_cast_fp16, y = input_165_cast_fp16)[name = tensor("input_167_cast_fp16")]; tensor input_169_axes_0 = const()[name = tensor("input_169_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_2_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68900928)))]; tensor encoder_layers_2_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_2_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68903040)))]; tensor input_169_cast_fp16 = layer_norm(axes = input_169_axes_0, beta = encoder_layers_2_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_2_norm_feed_forward2_weight_to_fp16, x = input_167_cast_fp16)[name = tensor("input_169_cast_fp16")]; tensor encoder_layers_2_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68905152))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(72050944))), name = tensor("encoder_layers_2_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_2_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_2_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(72051136)))]; tensor linear_26_cast_fp16 = linear(bias = encoder_layers_2_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_2_feed_forward2_linear1_weight_to_fp16_palettized, x = input_169_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor input_173_cast_fp16 = silu(x = linear_26_cast_fp16)[name = tensor("input_173_cast_fp16")]; tensor encoder_layers_2_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(72059392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75205184))), name = tensor("encoder_layers_2_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_2_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_2_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75205376)))]; tensor linear_27_cast_fp16 = linear(bias = encoder_layers_2_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_2_feed_forward2_linear2_weight_to_fp16_palettized, x = input_173_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor var_1057_to_fp16 = const()[name = tensor("op_1057_to_fp16"), val = tensor(0x1p-1)]; tensor var_1058_cast_fp16 = mul(x = linear_27_cast_fp16, y = var_1057_to_fp16)[name = tensor("op_1058_cast_fp16")]; tensor input_179_cast_fp16 = add(x = input_167_cast_fp16, y = var_1058_cast_fp16)[name = tensor("input_179_cast_fp16")]; tensor input_181_axes_0 = const()[name = tensor("input_181_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_2_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75207488)))]; tensor encoder_layers_2_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_2_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75209600)))]; tensor input_181_cast_fp16 = layer_norm(axes = input_181_axes_0, beta = encoder_layers_2_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_2_norm_out_weight_to_fp16, x = input_179_cast_fp16)[name = tensor("input_181_cast_fp16")]; tensor cache_13_begin_0 = const()[name = tensor("cache_13_begin_0"), val = tensor([3, 0, 0, 0])]; tensor cache_13_end_0 = const()[name = tensor("cache_13_end_0"), val = tensor([4, 1, 42, 1024])]; tensor cache_13_end_mask_0 = const()[name = tensor("cache_13_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_13_squeeze_mask_0 = const()[name = tensor("cache_13_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_13_cast_fp16 = slice_by_index(begin = cache_13_begin_0, end = cache_13_end_0, end_mask = cache_13_end_mask_0, squeeze_mask = cache_13_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_13_cast_fp16")]; tensor cache_15_begin_0 = const()[name = tensor("cache_15_begin_0"), val = tensor([3, 0, 0, 0])]; tensor cache_15_end_0 = const()[name = tensor("cache_15_end_0"), val = tensor([4, 1, 1024, 8])]; tensor cache_15_end_mask_0 = const()[name = tensor("cache_15_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_15_squeeze_mask_0 = const()[name = tensor("cache_15_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_15_cast_fp16 = slice_by_index(begin = cache_15_begin_0, end = cache_15_end_0, end_mask = cache_15_end_mask_0, squeeze_mask = cache_15_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_15_cast_fp16")]; tensor input_183_axes_0 = const()[name = tensor("input_183_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_3_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75211712)))]; tensor encoder_layers_3_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_3_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75213824)))]; tensor input_183_cast_fp16 = layer_norm(axes = input_183_axes_0, beta = encoder_layers_3_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_3_norm_feed_forward1_weight_to_fp16, x = input_181_cast_fp16)[name = tensor("input_183_cast_fp16")]; tensor encoder_layers_3_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75215936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78361728))), name = tensor("encoder_layers_3_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_3_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_3_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78361920)))]; tensor linear_28_cast_fp16 = linear(bias = encoder_layers_3_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_3_feed_forward1_linear1_weight_to_fp16_palettized, x = input_183_cast_fp16)[name = tensor("linear_28_cast_fp16")]; tensor input_187_cast_fp16 = silu(x = linear_28_cast_fp16)[name = tensor("input_187_cast_fp16")]; tensor encoder_layers_3_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78370176))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(81515968))), name = tensor("encoder_layers_3_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_3_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_3_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(81516160)))]; tensor linear_29_cast_fp16 = linear(bias = encoder_layers_3_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_3_feed_forward1_linear2_weight_to_fp16_palettized, x = input_187_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor var_1094_to_fp16 = const()[name = tensor("op_1094_to_fp16"), val = tensor(0x1p-1)]; tensor var_1095_cast_fp16 = mul(x = linear_29_cast_fp16, y = var_1094_to_fp16)[name = tensor("op_1095_cast_fp16")]; tensor input_193_cast_fp16 = add(x = input_181_cast_fp16, y = var_1095_cast_fp16)[name = tensor("input_193_cast_fp16")]; tensor key_7_axes_0 = const()[name = tensor("key_7_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_3_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(81518272)))]; tensor encoder_layers_3_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_3_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(81520384)))]; tensor key_7_cast_fp16 = layer_norm(axes = key_7_axes_0, beta = encoder_layers_3_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_3_norm_self_att_weight_to_fp16, x = input_193_cast_fp16)[name = tensor("key_7_cast_fp16")]; tensor input_195_interleave_0 = const()[name = tensor("input_195_interleave_0"), val = tensor(false)]; tensor input_195_cast_fp16 = concat(axis = var_68, interleave = input_195_interleave_0, values = (cache_13_cast_fp16, key_7_cast_fp16))[name = tensor("input_195_cast_fp16")]; tensor var_1117_begin_0 = const()[name = tensor("op_1117_begin_0"), val = tensor([0, 7, 0])]; tensor var_1117_end_0 = const()[name = tensor("op_1117_end_0"), val = tensor([1, 42, 1024])]; tensor var_1117_end_mask_0 = const()[name = tensor("op_1117_end_mask_0"), val = tensor([true, true, true])]; tensor var_1117_cast_fp16 = slice_by_index(begin = var_1117_begin_0, end = var_1117_end_0, end_mask = var_1117_end_mask_0, x = cache_13_cast_fp16)[name = tensor("op_1117_cast_fp16")]; tensor var_1123_interleave_0 = const()[name = tensor("op_1123_interleave_0"), val = tensor(false)]; tensor var_1123_cast_fp16 = concat(axis = var_68, interleave = var_1123_interleave_0, values = (var_1117_cast_fp16, key_7_cast_fp16))[name = tensor("op_1123_cast_fp16")]; tensor encoder_layers_3_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(81522496))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82308992))), name = tensor("encoder_layers_3_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_3_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82309184)))]; tensor linear_30_cast_fp16 = linear(bias = encoder_layers_3_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_3_self_attn_linear_q_weight_to_fp16_palettized, x = key_7_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor var_1128 = const()[name = tensor("op_1128"), val = tensor([1, -1, 8, 128])]; tensor q_19_cast_fp16 = reshape(shape = var_1128, x = linear_30_cast_fp16)[name = tensor("q_19_cast_fp16")]; tensor encoder_layers_3_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82311296))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83097792))), name = tensor("encoder_layers_3_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_3_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83097984)))]; tensor linear_31_cast_fp16 = linear(bias = encoder_layers_3_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_3_self_attn_linear_k_weight_to_fp16_palettized, x = input_195_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor var_1133 = const()[name = tensor("op_1133"), val = tensor([1, -1, 8, 128])]; tensor k_13_cast_fp16 = reshape(shape = var_1133, x = linear_31_cast_fp16)[name = tensor("k_13_cast_fp16")]; tensor encoder_layers_3_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83100096))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83886592))), name = tensor("encoder_layers_3_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_3_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83886784)))]; tensor linear_32_cast_fp16 = linear(bias = encoder_layers_3_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_3_self_attn_linear_v_weight_to_fp16_palettized, x = input_195_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor var_1138 = const()[name = tensor("op_1138"), val = tensor([1, -1, 8, 128])]; tensor v_7_cast_fp16 = reshape(shape = var_1138, x = linear_32_cast_fp16)[name = tensor("v_7_cast_fp16")]; tensor value_15_perm_0 = const()[name = tensor("value_15_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_3_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83888896)))]; tensor var_1151_cast_fp16 = add(x = q_19_cast_fp16, y = encoder_layers_3_self_attn_pos_bias_u_to_fp16)[name = tensor("op_1151_cast_fp16")]; tensor encoder_layers_3_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83891008)))]; tensor var_1153_cast_fp16 = add(x = q_19_cast_fp16, y = encoder_layers_3_self_attn_pos_bias_v_to_fp16)[name = tensor("op_1153_cast_fp16")]; tensor q_with_bias_v_7_perm_0 = const()[name = tensor("q_with_bias_v_7_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_85_transpose_x_0 = const()[name = tensor("x_85_transpose_x_0"), val = tensor(false)]; tensor x_85_transpose_y_0 = const()[name = tensor("x_85_transpose_y_0"), val = tensor(false)]; tensor op_1155_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_1155_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83893120))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83992704))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83992512)))]; tensor q_with_bias_v_7_cast_fp16 = transpose(perm = q_with_bias_v_7_perm_0, x = var_1153_cast_fp16)[name = tensor("transpose_335")]; tensor x_85_cast_fp16 = matmul(transpose_x = x_85_transpose_x_0, transpose_y = x_85_transpose_y_0, x = q_with_bias_v_7_cast_fp16, y = op_1155_to_fp16_quantized)[name = tensor("x_85_cast_fp16")]; tensor x_87_pad_0 = const()[name = tensor("x_87_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_87_mode_0 = const()[name = tensor("x_87_mode_0"), val = tensor("constant")]; tensor const_118_to_fp16 = const()[name = tensor("const_118_to_fp16"), val = tensor(0x0p+0)]; tensor x_87_cast_fp16 = pad(constant_val = const_118_to_fp16, mode = x_87_mode_0, pad = x_87_pad_0, x = x_85_cast_fp16)[name = tensor("x_87_cast_fp16")]; tensor var_1163 = const()[name = tensor("op_1163"), val = tensor([1, 8, -1, 7])]; tensor x_89_cast_fp16 = reshape(shape = var_1163, x = x_87_cast_fp16)[name = tensor("x_89_cast_fp16")]; tensor var_1167_begin_0 = const()[name = tensor("op_1167_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_1167_end_0 = const()[name = tensor("op_1167_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_1167_end_mask_0 = const()[name = tensor("op_1167_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_1167_cast_fp16 = slice_by_index(begin = var_1167_begin_0, end = var_1167_end_0, end_mask = var_1167_end_mask_0, x = x_89_cast_fp16)[name = tensor("op_1167_cast_fp16")]; tensor var_1168 = const()[name = tensor("op_1168"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_13_cast_fp16 = reshape(shape = var_1168, x = var_1167_cast_fp16)[name = tensor("matrix_bd_13_cast_fp16")]; tensor matrix_ac_7_transpose_x_0 = const()[name = tensor("matrix_ac_7_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_7_transpose_y_0 = const()[name = tensor("matrix_ac_7_transpose_y_0"), val = tensor(false)]; tensor transpose_102_perm_0 = const()[name = tensor("transpose_102_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_103_perm_0 = const()[name = tensor("transpose_103_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_103 = transpose(perm = transpose_103_perm_0, x = k_13_cast_fp16)[name = tensor("transpose_333")]; tensor transpose_102 = transpose(perm = transpose_102_perm_0, x = var_1151_cast_fp16)[name = tensor("transpose_334")]; tensor matrix_ac_7_cast_fp16 = matmul(transpose_x = matrix_ac_7_transpose_x_0, transpose_y = matrix_ac_7_transpose_y_0, x = transpose_102, y = transpose_103)[name = tensor("matrix_ac_7_cast_fp16")]; tensor matrix_bd_15_begin_0 = const()[name = tensor("matrix_bd_15_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_15_end_0 = const()[name = tensor("matrix_bd_15_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_15_end_mask_0 = const()[name = tensor("matrix_bd_15_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_15_cast_fp16 = slice_by_index(begin = matrix_bd_15_begin_0, end = matrix_bd_15_end_0, end_mask = matrix_bd_15_end_mask_0, x = matrix_bd_13_cast_fp16)[name = tensor("matrix_bd_15_cast_fp16")]; tensor var_1177_cast_fp16 = add(x = matrix_ac_7_cast_fp16, y = matrix_bd_15_cast_fp16)[name = tensor("op_1177_cast_fp16")]; tensor _inversed_scores_13_y_0_to_fp16 = const()[name = tensor("_inversed_scores_13_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_13_cast_fp16 = mul(x = var_1177_cast_fp16, y = _inversed_scores_13_y_0_to_fp16)[name = tensor("_inversed_scores_13_cast_fp16")]; tensor scores_15_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_13_cast_fp16, cond = mask_11)[name = tensor("scores_15_cast_fp16")]; tensor var_1183_cast_fp16 = softmax(axis = var_59, x = scores_15_cast_fp16)[name = tensor("op_1183_cast_fp16")]; tensor input_197_cast_fp16 = select(a = var_44_to_fp16, b = var_1183_cast_fp16, cond = mask_11)[name = tensor("input_197_cast_fp16")]; tensor x_91_transpose_x_0 = const()[name = tensor("x_91_transpose_x_0"), val = tensor(false)]; tensor x_91_transpose_y_0 = const()[name = tensor("x_91_transpose_y_0"), val = tensor(false)]; tensor value_15_cast_fp16 = transpose(perm = value_15_perm_0, x = v_7_cast_fp16)[name = tensor("transpose_332")]; tensor x_91_cast_fp16 = matmul(transpose_x = x_91_transpose_x_0, transpose_y = x_91_transpose_y_0, x = input_197_cast_fp16, y = value_15_cast_fp16)[name = tensor("x_91_cast_fp16")]; tensor var_1187_perm_0 = const()[name = tensor("op_1187_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1188 = const()[name = tensor("op_1188"), val = tensor([1, -1, 1024])]; tensor var_1187_cast_fp16 = transpose(perm = var_1187_perm_0, x = x_91_cast_fp16)[name = tensor("transpose_331")]; tensor input_199_cast_fp16 = reshape(shape = var_1188, x = var_1187_cast_fp16)[name = tensor("input_199_cast_fp16")]; tensor encoder_layers_3_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83993024))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(84779520))), name = tensor("encoder_layers_3_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_3_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(84779712)))]; tensor linear_34_cast_fp16 = linear(bias = encoder_layers_3_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_3_self_attn_linear_out_weight_to_fp16_palettized, x = input_199_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor input_203_cast_fp16 = add(x = input_193_cast_fp16, y = linear_34_cast_fp16)[name = tensor("input_203_cast_fp16")]; tensor x_95_axes_0 = const()[name = tensor("x_95_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_3_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(84781824)))]; tensor encoder_layers_3_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_3_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(84783936)))]; tensor x_95_cast_fp16 = layer_norm(axes = x_95_axes_0, beta = encoder_layers_3_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_3_norm_conv_weight_to_fp16, x = input_203_cast_fp16)[name = tensor("x_95_cast_fp16")]; tensor input_205_perm_0 = const()[name = tensor("input_205_perm_0"), val = tensor([0, 2, 1])]; tensor input_207_pad_type_0 = const()[name = tensor("input_207_pad_type_0"), val = tensor("valid")]; tensor input_207_strides_0 = const()[name = tensor("input_207_strides_0"), val = tensor([1])]; tensor input_207_pad_0 = const()[name = tensor("input_207_pad_0"), val = tensor([0, 0])]; tensor input_207_dilations_0 = const()[name = tensor("input_207_dilations_0"), val = tensor([1])]; tensor input_207_groups_0 = const()[name = tensor("input_207_groups_0"), val = tensor(1)]; tensor encoder_layers_3_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_3_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(84786048))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(86883264))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_205_cast_fp16 = transpose(perm = input_205_perm_0, x = x_95_cast_fp16)[name = tensor("transpose_330")]; tensor input_207_cast_fp16 = conv(dilations = input_207_dilations_0, groups = input_207_groups_0, pad = input_207_pad_0, pad_type = input_207_pad_type_0, strides = input_207_strides_0, weight = encoder_layers_3_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_205_cast_fp16)[name = tensor("input_207_cast_fp16")]; tensor x_97_split_num_splits_0 = const()[name = tensor("x_97_split_num_splits_0"), val = tensor(2)]; tensor x_97_split_axis_0 = const()[name = tensor("x_97_split_axis_0"), val = tensor(1)]; tensor x_97_split_cast_fp16_0, tensor x_97_split_cast_fp16_1 = split(axis = x_97_split_axis_0, num_splits = x_97_split_num_splits_0, x = input_207_cast_fp16)[name = tensor("x_97_split_cast_fp16")]; tensor x_97_split_1_sigmoid_cast_fp16 = sigmoid(x = x_97_split_cast_fp16_1)[name = tensor("x_97_split_1_sigmoid_cast_fp16")]; tensor x_97_cast_fp16 = mul(x = x_97_split_cast_fp16_0, y = x_97_split_1_sigmoid_cast_fp16)[name = tensor("x_97_cast_fp16")]; tensor input_209_cast_fp16 = select(a = var_44_to_fp16, b = x_97_cast_fp16, cond = var_575)[name = tensor("input_209_cast_fp16")]; tensor new_x_15_interleave_0 = const()[name = tensor("new_x_15_interleave_0"), val = tensor(false)]; tensor new_x_15_cast_fp16 = concat(axis = var_59, interleave = new_x_15_interleave_0, values = (cache_15_cast_fp16, input_209_cast_fp16))[name = tensor("new_x_15_cast_fp16")]; tensor var_1227_begin_0 = const()[name = tensor("op_1227_begin_0"), val = tensor([0, 0, 7])]; tensor var_1227_end_0 = const()[name = tensor("op_1227_end_0"), val = tensor([1, 1024, 15])]; tensor var_1227_end_mask_0 = const()[name = tensor("op_1227_end_mask_0"), val = tensor([true, true, true])]; tensor var_1227_cast_fp16 = slice_by_index(begin = var_1227_begin_0, end = var_1227_end_0, end_mask = var_1227_end_mask_0, x = new_x_15_cast_fp16)[name = tensor("op_1227_cast_fp16")]; tensor x_99_pad_type_0 = const()[name = tensor("x_99_pad_type_0"), val = tensor("valid")]; tensor x_99_groups_0 = const()[name = tensor("x_99_groups_0"), val = tensor(1024)]; tensor x_99_strides_0 = const()[name = tensor("x_99_strides_0"), val = tensor([1])]; tensor x_99_pad_0 = const()[name = tensor("x_99_pad_0"), val = tensor([0, 0])]; tensor x_99_dilations_0 = const()[name = tensor("x_99_dilations_0"), val = tensor([1])]; tensor encoder_layers_3_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_3_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(86887424))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(86896704))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_99_cast_fp16 = conv(dilations = x_99_dilations_0, groups = x_99_groups_0, pad = x_99_pad_0, pad_type = x_99_pad_type_0, strides = x_99_strides_0, weight = encoder_layers_3_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_15_cast_fp16)[name = tensor("x_99_cast_fp16")]; tensor input_211_perm_0 = const()[name = tensor("input_211_perm_0"), val = tensor([0, 2, 1])]; tensor x_101_axes_0 = const()[name = tensor("x_101_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_3_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(86898816)))]; tensor encoder_layers_3_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_3_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(86900928)))]; tensor input_211_cast_fp16 = transpose(perm = input_211_perm_0, x = x_99_cast_fp16)[name = tensor("transpose_329")]; tensor x_101_cast_fp16 = layer_norm(axes = x_101_axes_0, beta = encoder_layers_3_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_3_conv_batch_norm_weight_to_fp16, x = input_211_cast_fp16)[name = tensor("x_101_cast_fp16")]; tensor input_213_perm_0 = const()[name = tensor("input_213_perm_0"), val = tensor([0, 2, 1])]; tensor input_213_cast_fp16 = transpose(perm = input_213_perm_0, x = x_101_cast_fp16)[name = tensor("transpose_328")]; tensor input_215_cast_fp16 = silu(x = input_213_cast_fp16)[name = tensor("input_215_cast_fp16")]; tensor x_103_pad_type_0 = const()[name = tensor("x_103_pad_type_0"), val = tensor("valid")]; tensor x_103_strides_0 = const()[name = tensor("x_103_strides_0"), val = tensor([1])]; tensor x_103_pad_0 = const()[name = tensor("x_103_pad_0"), val = tensor([0, 0])]; tensor x_103_dilations_0 = const()[name = tensor("x_103_dilations_0"), val = tensor([1])]; tensor x_103_groups_0 = const()[name = tensor("x_103_groups_0"), val = tensor(1)]; tensor encoder_layers_3_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_3_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(86903040))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(87951680))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_103_cast_fp16 = conv(dilations = x_103_dilations_0, groups = x_103_groups_0, pad = x_103_pad_0, pad_type = x_103_pad_type_0, strides = x_103_strides_0, weight = encoder_layers_3_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_215_cast_fp16)[name = tensor("x_103_cast_fp16")]; tensor input_217_perm_0 = const()[name = tensor("input_217_perm_0"), val = tensor([0, 2, 1])]; tensor input_217_cast_fp16 = transpose(perm = input_217_perm_0, x = x_103_cast_fp16)[name = tensor("transpose_327")]; tensor input_219_cast_fp16 = add(x = input_203_cast_fp16, y = input_217_cast_fp16)[name = tensor("input_219_cast_fp16")]; tensor input_221_axes_0 = const()[name = tensor("input_221_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_3_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(87953792)))]; tensor encoder_layers_3_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_3_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(87955904)))]; tensor input_221_cast_fp16 = layer_norm(axes = input_221_axes_0, beta = encoder_layers_3_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_3_norm_feed_forward2_weight_to_fp16, x = input_219_cast_fp16)[name = tensor("input_221_cast_fp16")]; tensor encoder_layers_3_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(87958016))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(91103808))), name = tensor("encoder_layers_3_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_3_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_3_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(91104000)))]; tensor linear_35_cast_fp16 = linear(bias = encoder_layers_3_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_3_feed_forward2_linear1_weight_to_fp16_palettized, x = input_221_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor input_225_cast_fp16 = silu(x = linear_35_cast_fp16)[name = tensor("input_225_cast_fp16")]; tensor encoder_layers_3_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(91112256))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94258048))), name = tensor("encoder_layers_3_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_3_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_3_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94258240)))]; tensor linear_36_cast_fp16 = linear(bias = encoder_layers_3_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_3_feed_forward2_linear2_weight_to_fp16_palettized, x = input_225_cast_fp16)[name = tensor("linear_36_cast_fp16")]; tensor var_1270_to_fp16 = const()[name = tensor("op_1270_to_fp16"), val = tensor(0x1p-1)]; tensor var_1271_cast_fp16 = mul(x = linear_36_cast_fp16, y = var_1270_to_fp16)[name = tensor("op_1271_cast_fp16")]; tensor input_231_cast_fp16 = add(x = input_219_cast_fp16, y = var_1271_cast_fp16)[name = tensor("input_231_cast_fp16")]; tensor input_233_axes_0 = const()[name = tensor("input_233_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_3_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94260352)))]; tensor encoder_layers_3_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_3_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94262464)))]; tensor input_233_cast_fp16 = layer_norm(axes = input_233_axes_0, beta = encoder_layers_3_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_3_norm_out_weight_to_fp16, x = input_231_cast_fp16)[name = tensor("input_233_cast_fp16")]; tensor cache_17_begin_0 = const()[name = tensor("cache_17_begin_0"), val = tensor([4, 0, 0, 0])]; tensor cache_17_end_0 = const()[name = tensor("cache_17_end_0"), val = tensor([5, 1, 42, 1024])]; tensor cache_17_end_mask_0 = const()[name = tensor("cache_17_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_17_squeeze_mask_0 = const()[name = tensor("cache_17_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_17_cast_fp16 = slice_by_index(begin = cache_17_begin_0, end = cache_17_end_0, end_mask = cache_17_end_mask_0, squeeze_mask = cache_17_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_17_cast_fp16")]; tensor cache_19_begin_0 = const()[name = tensor("cache_19_begin_0"), val = tensor([4, 0, 0, 0])]; tensor cache_19_end_0 = const()[name = tensor("cache_19_end_0"), val = tensor([5, 1, 1024, 8])]; tensor cache_19_end_mask_0 = const()[name = tensor("cache_19_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_19_squeeze_mask_0 = const()[name = tensor("cache_19_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_19_cast_fp16 = slice_by_index(begin = cache_19_begin_0, end = cache_19_end_0, end_mask = cache_19_end_mask_0, squeeze_mask = cache_19_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_19_cast_fp16")]; tensor input_235_axes_0 = const()[name = tensor("input_235_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_4_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94264576)))]; tensor encoder_layers_4_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_4_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94266688)))]; tensor input_235_cast_fp16 = layer_norm(axes = input_235_axes_0, beta = encoder_layers_4_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_4_norm_feed_forward1_weight_to_fp16, x = input_233_cast_fp16)[name = tensor("input_235_cast_fp16")]; tensor encoder_layers_4_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94268800))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(97414592))), name = tensor("encoder_layers_4_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_4_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_4_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(97414784)))]; tensor linear_37_cast_fp16 = linear(bias = encoder_layers_4_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_4_feed_forward1_linear1_weight_to_fp16_palettized, x = input_235_cast_fp16)[name = tensor("linear_37_cast_fp16")]; tensor input_239_cast_fp16 = silu(x = linear_37_cast_fp16)[name = tensor("input_239_cast_fp16")]; tensor encoder_layers_4_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(97423040))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100568832))), name = tensor("encoder_layers_4_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_4_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_4_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100569024)))]; tensor linear_38_cast_fp16 = linear(bias = encoder_layers_4_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_4_feed_forward1_linear2_weight_to_fp16_palettized, x = input_239_cast_fp16)[name = tensor("linear_38_cast_fp16")]; tensor var_1307_to_fp16 = const()[name = tensor("op_1307_to_fp16"), val = tensor(0x1p-1)]; tensor var_1308_cast_fp16 = mul(x = linear_38_cast_fp16, y = var_1307_to_fp16)[name = tensor("op_1308_cast_fp16")]; tensor input_245_cast_fp16 = add(x = input_233_cast_fp16, y = var_1308_cast_fp16)[name = tensor("input_245_cast_fp16")]; tensor key_9_axes_0 = const()[name = tensor("key_9_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_4_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100571136)))]; tensor encoder_layers_4_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_4_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100573248)))]; tensor key_9_cast_fp16 = layer_norm(axes = key_9_axes_0, beta = encoder_layers_4_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_4_norm_self_att_weight_to_fp16, x = input_245_cast_fp16)[name = tensor("key_9_cast_fp16")]; tensor input_247_interleave_0 = const()[name = tensor("input_247_interleave_0"), val = tensor(false)]; tensor input_247_cast_fp16 = concat(axis = var_68, interleave = input_247_interleave_0, values = (cache_17_cast_fp16, key_9_cast_fp16))[name = tensor("input_247_cast_fp16")]; tensor var_1330_begin_0 = const()[name = tensor("op_1330_begin_0"), val = tensor([0, 7, 0])]; tensor var_1330_end_0 = const()[name = tensor("op_1330_end_0"), val = tensor([1, 42, 1024])]; tensor var_1330_end_mask_0 = const()[name = tensor("op_1330_end_mask_0"), val = tensor([true, true, true])]; tensor var_1330_cast_fp16 = slice_by_index(begin = var_1330_begin_0, end = var_1330_end_0, end_mask = var_1330_end_mask_0, x = cache_17_cast_fp16)[name = tensor("op_1330_cast_fp16")]; tensor var_1336_interleave_0 = const()[name = tensor("op_1336_interleave_0"), val = tensor(false)]; tensor var_1336_cast_fp16 = concat(axis = var_68, interleave = var_1336_interleave_0, values = (var_1330_cast_fp16, key_9_cast_fp16))[name = tensor("op_1336_cast_fp16")]; tensor encoder_layers_4_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100575360))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(101361856))), name = tensor("encoder_layers_4_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_4_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(101362048)))]; tensor linear_39_cast_fp16 = linear(bias = encoder_layers_4_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_4_self_attn_linear_q_weight_to_fp16_palettized, x = key_9_cast_fp16)[name = tensor("linear_39_cast_fp16")]; tensor var_1341 = const()[name = tensor("op_1341"), val = tensor([1, -1, 8, 128])]; tensor q_25_cast_fp16 = reshape(shape = var_1341, x = linear_39_cast_fp16)[name = tensor("q_25_cast_fp16")]; tensor encoder_layers_4_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(101364160))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102150656))), name = tensor("encoder_layers_4_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_4_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102150848)))]; tensor linear_40_cast_fp16 = linear(bias = encoder_layers_4_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_4_self_attn_linear_k_weight_to_fp16_palettized, x = input_247_cast_fp16)[name = tensor("linear_40_cast_fp16")]; tensor var_1346 = const()[name = tensor("op_1346"), val = tensor([1, -1, 8, 128])]; tensor k_17_cast_fp16 = reshape(shape = var_1346, x = linear_40_cast_fp16)[name = tensor("k_17_cast_fp16")]; tensor encoder_layers_4_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102152960))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102939456))), name = tensor("encoder_layers_4_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_4_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102939648)))]; tensor linear_41_cast_fp16 = linear(bias = encoder_layers_4_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_4_self_attn_linear_v_weight_to_fp16_palettized, x = input_247_cast_fp16)[name = tensor("linear_41_cast_fp16")]; tensor var_1351 = const()[name = tensor("op_1351"), val = tensor([1, -1, 8, 128])]; tensor v_9_cast_fp16 = reshape(shape = var_1351, x = linear_41_cast_fp16)[name = tensor("v_9_cast_fp16")]; tensor value_17_perm_0 = const()[name = tensor("value_17_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_4_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102941760)))]; tensor var_1364_cast_fp16 = add(x = q_25_cast_fp16, y = encoder_layers_4_self_attn_pos_bias_u_to_fp16)[name = tensor("op_1364_cast_fp16")]; tensor encoder_layers_4_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102943872)))]; tensor var_1366_cast_fp16 = add(x = q_25_cast_fp16, y = encoder_layers_4_self_attn_pos_bias_v_to_fp16)[name = tensor("op_1366_cast_fp16")]; tensor q_with_bias_v_9_perm_0 = const()[name = tensor("q_with_bias_v_9_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_111_transpose_x_0 = const()[name = tensor("x_111_transpose_x_0"), val = tensor(false)]; tensor x_111_transpose_y_0 = const()[name = tensor("x_111_transpose_y_0"), val = tensor(false)]; tensor op_1368_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_1368_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102945984))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103045568))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103045376)))]; tensor q_with_bias_v_9_cast_fp16 = transpose(perm = q_with_bias_v_9_perm_0, x = var_1366_cast_fp16)[name = tensor("transpose_326")]; tensor x_111_cast_fp16 = matmul(transpose_x = x_111_transpose_x_0, transpose_y = x_111_transpose_y_0, x = q_with_bias_v_9_cast_fp16, y = op_1368_to_fp16_quantized)[name = tensor("x_111_cast_fp16")]; tensor x_113_pad_0 = const()[name = tensor("x_113_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_113_mode_0 = const()[name = tensor("x_113_mode_0"), val = tensor("constant")]; tensor const_131_to_fp16 = const()[name = tensor("const_131_to_fp16"), val = tensor(0x0p+0)]; tensor x_113_cast_fp16 = pad(constant_val = const_131_to_fp16, mode = x_113_mode_0, pad = x_113_pad_0, x = x_111_cast_fp16)[name = tensor("x_113_cast_fp16")]; tensor var_1376 = const()[name = tensor("op_1376"), val = tensor([1, 8, -1, 7])]; tensor x_115_cast_fp16 = reshape(shape = var_1376, x = x_113_cast_fp16)[name = tensor("x_115_cast_fp16")]; tensor var_1380_begin_0 = const()[name = tensor("op_1380_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_1380_end_0 = const()[name = tensor("op_1380_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_1380_end_mask_0 = const()[name = tensor("op_1380_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_1380_cast_fp16 = slice_by_index(begin = var_1380_begin_0, end = var_1380_end_0, end_mask = var_1380_end_mask_0, x = x_115_cast_fp16)[name = tensor("op_1380_cast_fp16")]; tensor var_1381 = const()[name = tensor("op_1381"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_17_cast_fp16 = reshape(shape = var_1381, x = var_1380_cast_fp16)[name = tensor("matrix_bd_17_cast_fp16")]; tensor matrix_ac_9_transpose_x_0 = const()[name = tensor("matrix_ac_9_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_9_transpose_y_0 = const()[name = tensor("matrix_ac_9_transpose_y_0"), val = tensor(false)]; tensor transpose_104_perm_0 = const()[name = tensor("transpose_104_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_105_perm_0 = const()[name = tensor("transpose_105_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_105 = transpose(perm = transpose_105_perm_0, x = k_17_cast_fp16)[name = tensor("transpose_324")]; tensor transpose_104 = transpose(perm = transpose_104_perm_0, x = var_1364_cast_fp16)[name = tensor("transpose_325")]; tensor matrix_ac_9_cast_fp16 = matmul(transpose_x = matrix_ac_9_transpose_x_0, transpose_y = matrix_ac_9_transpose_y_0, x = transpose_104, y = transpose_105)[name = tensor("matrix_ac_9_cast_fp16")]; tensor matrix_bd_19_begin_0 = const()[name = tensor("matrix_bd_19_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_19_end_0 = const()[name = tensor("matrix_bd_19_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_19_end_mask_0 = const()[name = tensor("matrix_bd_19_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_19_cast_fp16 = slice_by_index(begin = matrix_bd_19_begin_0, end = matrix_bd_19_end_0, end_mask = matrix_bd_19_end_mask_0, x = matrix_bd_17_cast_fp16)[name = tensor("matrix_bd_19_cast_fp16")]; tensor var_1390_cast_fp16 = add(x = matrix_ac_9_cast_fp16, y = matrix_bd_19_cast_fp16)[name = tensor("op_1390_cast_fp16")]; tensor _inversed_scores_17_y_0_to_fp16 = const()[name = tensor("_inversed_scores_17_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_17_cast_fp16 = mul(x = var_1390_cast_fp16, y = _inversed_scores_17_y_0_to_fp16)[name = tensor("_inversed_scores_17_cast_fp16")]; tensor scores_19_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_17_cast_fp16, cond = mask_11)[name = tensor("scores_19_cast_fp16")]; tensor var_1396_cast_fp16 = softmax(axis = var_59, x = scores_19_cast_fp16)[name = tensor("op_1396_cast_fp16")]; tensor input_249_cast_fp16 = select(a = var_44_to_fp16, b = var_1396_cast_fp16, cond = mask_11)[name = tensor("input_249_cast_fp16")]; tensor x_117_transpose_x_0 = const()[name = tensor("x_117_transpose_x_0"), val = tensor(false)]; tensor x_117_transpose_y_0 = const()[name = tensor("x_117_transpose_y_0"), val = tensor(false)]; tensor value_17_cast_fp16 = transpose(perm = value_17_perm_0, x = v_9_cast_fp16)[name = tensor("transpose_323")]; tensor x_117_cast_fp16 = matmul(transpose_x = x_117_transpose_x_0, transpose_y = x_117_transpose_y_0, x = input_249_cast_fp16, y = value_17_cast_fp16)[name = tensor("x_117_cast_fp16")]; tensor var_1400_perm_0 = const()[name = tensor("op_1400_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1401 = const()[name = tensor("op_1401"), val = tensor([1, -1, 1024])]; tensor var_1400_cast_fp16 = transpose(perm = var_1400_perm_0, x = x_117_cast_fp16)[name = tensor("transpose_322")]; tensor input_251_cast_fp16 = reshape(shape = var_1401, x = var_1400_cast_fp16)[name = tensor("input_251_cast_fp16")]; tensor encoder_layers_4_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103045888))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103832384))), name = tensor("encoder_layers_4_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_4_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103832576)))]; tensor linear_43_cast_fp16 = linear(bias = encoder_layers_4_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_4_self_attn_linear_out_weight_to_fp16_palettized, x = input_251_cast_fp16)[name = tensor("linear_43_cast_fp16")]; tensor input_255_cast_fp16 = add(x = input_245_cast_fp16, y = linear_43_cast_fp16)[name = tensor("input_255_cast_fp16")]; tensor x_121_axes_0 = const()[name = tensor("x_121_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_4_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103834688)))]; tensor encoder_layers_4_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_4_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103836800)))]; tensor x_121_cast_fp16 = layer_norm(axes = x_121_axes_0, beta = encoder_layers_4_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_4_norm_conv_weight_to_fp16, x = input_255_cast_fp16)[name = tensor("x_121_cast_fp16")]; tensor input_257_perm_0 = const()[name = tensor("input_257_perm_0"), val = tensor([0, 2, 1])]; tensor input_259_pad_type_0 = const()[name = tensor("input_259_pad_type_0"), val = tensor("valid")]; tensor input_259_strides_0 = const()[name = tensor("input_259_strides_0"), val = tensor([1])]; tensor input_259_pad_0 = const()[name = tensor("input_259_pad_0"), val = tensor([0, 0])]; tensor input_259_dilations_0 = const()[name = tensor("input_259_dilations_0"), val = tensor([1])]; tensor input_259_groups_0 = const()[name = tensor("input_259_groups_0"), val = tensor(1)]; tensor encoder_layers_4_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_4_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103838912))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(105936128))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_257_cast_fp16 = transpose(perm = input_257_perm_0, x = x_121_cast_fp16)[name = tensor("transpose_321")]; tensor input_259_cast_fp16 = conv(dilations = input_259_dilations_0, groups = input_259_groups_0, pad = input_259_pad_0, pad_type = input_259_pad_type_0, strides = input_259_strides_0, weight = encoder_layers_4_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_257_cast_fp16)[name = tensor("input_259_cast_fp16")]; tensor x_123_split_num_splits_0 = const()[name = tensor("x_123_split_num_splits_0"), val = tensor(2)]; tensor x_123_split_axis_0 = const()[name = tensor("x_123_split_axis_0"), val = tensor(1)]; tensor x_123_split_cast_fp16_0, tensor x_123_split_cast_fp16_1 = split(axis = x_123_split_axis_0, num_splits = x_123_split_num_splits_0, x = input_259_cast_fp16)[name = tensor("x_123_split_cast_fp16")]; tensor x_123_split_1_sigmoid_cast_fp16 = sigmoid(x = x_123_split_cast_fp16_1)[name = tensor("x_123_split_1_sigmoid_cast_fp16")]; tensor x_123_cast_fp16 = mul(x = x_123_split_cast_fp16_0, y = x_123_split_1_sigmoid_cast_fp16)[name = tensor("x_123_cast_fp16")]; tensor input_261_cast_fp16 = select(a = var_44_to_fp16, b = x_123_cast_fp16, cond = var_575)[name = tensor("input_261_cast_fp16")]; tensor new_x_19_interleave_0 = const()[name = tensor("new_x_19_interleave_0"), val = tensor(false)]; tensor new_x_19_cast_fp16 = concat(axis = var_59, interleave = new_x_19_interleave_0, values = (cache_19_cast_fp16, input_261_cast_fp16))[name = tensor("new_x_19_cast_fp16")]; tensor var_1440_begin_0 = const()[name = tensor("op_1440_begin_0"), val = tensor([0, 0, 7])]; tensor var_1440_end_0 = const()[name = tensor("op_1440_end_0"), val = tensor([1, 1024, 15])]; tensor var_1440_end_mask_0 = const()[name = tensor("op_1440_end_mask_0"), val = tensor([true, true, true])]; tensor var_1440_cast_fp16 = slice_by_index(begin = var_1440_begin_0, end = var_1440_end_0, end_mask = var_1440_end_mask_0, x = new_x_19_cast_fp16)[name = tensor("op_1440_cast_fp16")]; tensor x_125_pad_type_0 = const()[name = tensor("x_125_pad_type_0"), val = tensor("valid")]; tensor x_125_groups_0 = const()[name = tensor("x_125_groups_0"), val = tensor(1024)]; tensor x_125_strides_0 = const()[name = tensor("x_125_strides_0"), val = tensor([1])]; tensor x_125_pad_0 = const()[name = tensor("x_125_pad_0"), val = tensor([0, 0])]; tensor x_125_dilations_0 = const()[name = tensor("x_125_dilations_0"), val = tensor([1])]; tensor encoder_layers_4_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_4_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(105940288))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(105949568))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_125_cast_fp16 = conv(dilations = x_125_dilations_0, groups = x_125_groups_0, pad = x_125_pad_0, pad_type = x_125_pad_type_0, strides = x_125_strides_0, weight = encoder_layers_4_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_19_cast_fp16)[name = tensor("x_125_cast_fp16")]; tensor input_263_perm_0 = const()[name = tensor("input_263_perm_0"), val = tensor([0, 2, 1])]; tensor x_127_axes_0 = const()[name = tensor("x_127_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_4_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(105951680)))]; tensor encoder_layers_4_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_4_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(105953792)))]; tensor input_263_cast_fp16 = transpose(perm = input_263_perm_0, x = x_125_cast_fp16)[name = tensor("transpose_320")]; tensor x_127_cast_fp16 = layer_norm(axes = x_127_axes_0, beta = encoder_layers_4_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_4_conv_batch_norm_weight_to_fp16, x = input_263_cast_fp16)[name = tensor("x_127_cast_fp16")]; tensor input_265_perm_0 = const()[name = tensor("input_265_perm_0"), val = tensor([0, 2, 1])]; tensor input_265_cast_fp16 = transpose(perm = input_265_perm_0, x = x_127_cast_fp16)[name = tensor("transpose_319")]; tensor input_267_cast_fp16 = silu(x = input_265_cast_fp16)[name = tensor("input_267_cast_fp16")]; tensor x_129_pad_type_0 = const()[name = tensor("x_129_pad_type_0"), val = tensor("valid")]; tensor x_129_strides_0 = const()[name = tensor("x_129_strides_0"), val = tensor([1])]; tensor x_129_pad_0 = const()[name = tensor("x_129_pad_0"), val = tensor([0, 0])]; tensor x_129_dilations_0 = const()[name = tensor("x_129_dilations_0"), val = tensor([1])]; tensor x_129_groups_0 = const()[name = tensor("x_129_groups_0"), val = tensor(1)]; tensor encoder_layers_4_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_4_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(105955904))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(107004544))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_129_cast_fp16 = conv(dilations = x_129_dilations_0, groups = x_129_groups_0, pad = x_129_pad_0, pad_type = x_129_pad_type_0, strides = x_129_strides_0, weight = encoder_layers_4_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_267_cast_fp16)[name = tensor("x_129_cast_fp16")]; tensor input_269_perm_0 = const()[name = tensor("input_269_perm_0"), val = tensor([0, 2, 1])]; tensor input_269_cast_fp16 = transpose(perm = input_269_perm_0, x = x_129_cast_fp16)[name = tensor("transpose_318")]; tensor input_271_cast_fp16 = add(x = input_255_cast_fp16, y = input_269_cast_fp16)[name = tensor("input_271_cast_fp16")]; tensor input_273_axes_0 = const()[name = tensor("input_273_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_4_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(107006656)))]; tensor encoder_layers_4_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_4_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(107008768)))]; tensor input_273_cast_fp16 = layer_norm(axes = input_273_axes_0, beta = encoder_layers_4_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_4_norm_feed_forward2_weight_to_fp16, x = input_271_cast_fp16)[name = tensor("input_273_cast_fp16")]; tensor encoder_layers_4_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(107010880))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110156672))), name = tensor("encoder_layers_4_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_4_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_4_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110156864)))]; tensor linear_44_cast_fp16 = linear(bias = encoder_layers_4_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_4_feed_forward2_linear1_weight_to_fp16_palettized, x = input_273_cast_fp16)[name = tensor("linear_44_cast_fp16")]; tensor input_277_cast_fp16 = silu(x = linear_44_cast_fp16)[name = tensor("input_277_cast_fp16")]; tensor encoder_layers_4_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110165120))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(113310912))), name = tensor("encoder_layers_4_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_4_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_4_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(113311104)))]; tensor linear_45_cast_fp16 = linear(bias = encoder_layers_4_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_4_feed_forward2_linear2_weight_to_fp16_palettized, x = input_277_cast_fp16)[name = tensor("linear_45_cast_fp16")]; tensor var_1483_to_fp16 = const()[name = tensor("op_1483_to_fp16"), val = tensor(0x1p-1)]; tensor var_1484_cast_fp16 = mul(x = linear_45_cast_fp16, y = var_1483_to_fp16)[name = tensor("op_1484_cast_fp16")]; tensor input_283_cast_fp16 = add(x = input_271_cast_fp16, y = var_1484_cast_fp16)[name = tensor("input_283_cast_fp16")]; tensor input_285_axes_0 = const()[name = tensor("input_285_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_4_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(113313216)))]; tensor encoder_layers_4_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_4_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(113315328)))]; tensor input_285_cast_fp16 = layer_norm(axes = input_285_axes_0, beta = encoder_layers_4_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_4_norm_out_weight_to_fp16, x = input_283_cast_fp16)[name = tensor("input_285_cast_fp16")]; tensor cache_21_begin_0 = const()[name = tensor("cache_21_begin_0"), val = tensor([5, 0, 0, 0])]; tensor cache_21_end_0 = const()[name = tensor("cache_21_end_0"), val = tensor([6, 1, 42, 1024])]; tensor cache_21_end_mask_0 = const()[name = tensor("cache_21_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_21_squeeze_mask_0 = const()[name = tensor("cache_21_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_21_cast_fp16 = slice_by_index(begin = cache_21_begin_0, end = cache_21_end_0, end_mask = cache_21_end_mask_0, squeeze_mask = cache_21_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_21_cast_fp16")]; tensor cache_23_begin_0 = const()[name = tensor("cache_23_begin_0"), val = tensor([5, 0, 0, 0])]; tensor cache_23_end_0 = const()[name = tensor("cache_23_end_0"), val = tensor([6, 1, 1024, 8])]; tensor cache_23_end_mask_0 = const()[name = tensor("cache_23_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_23_squeeze_mask_0 = const()[name = tensor("cache_23_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_23_cast_fp16 = slice_by_index(begin = cache_23_begin_0, end = cache_23_end_0, end_mask = cache_23_end_mask_0, squeeze_mask = cache_23_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_23_cast_fp16")]; tensor input_287_axes_0 = const()[name = tensor("input_287_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_5_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(113317440)))]; tensor encoder_layers_5_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_5_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(113319552)))]; tensor input_287_cast_fp16 = layer_norm(axes = input_287_axes_0, beta = encoder_layers_5_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_5_norm_feed_forward1_weight_to_fp16, x = input_285_cast_fp16)[name = tensor("input_287_cast_fp16")]; tensor encoder_layers_5_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(113321664))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116467456))), name = tensor("encoder_layers_5_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_5_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_5_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116467648)))]; tensor linear_46_cast_fp16 = linear(bias = encoder_layers_5_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_5_feed_forward1_linear1_weight_to_fp16_palettized, x = input_287_cast_fp16)[name = tensor("linear_46_cast_fp16")]; tensor input_291_cast_fp16 = silu(x = linear_46_cast_fp16)[name = tensor("input_291_cast_fp16")]; tensor encoder_layers_5_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116475904))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119621696))), name = tensor("encoder_layers_5_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_5_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_5_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119621888)))]; tensor linear_47_cast_fp16 = linear(bias = encoder_layers_5_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_5_feed_forward1_linear2_weight_to_fp16_palettized, x = input_291_cast_fp16)[name = tensor("linear_47_cast_fp16")]; tensor var_1520_to_fp16 = const()[name = tensor("op_1520_to_fp16"), val = tensor(0x1p-1)]; tensor var_1521_cast_fp16 = mul(x = linear_47_cast_fp16, y = var_1520_to_fp16)[name = tensor("op_1521_cast_fp16")]; tensor input_297_cast_fp16 = add(x = input_285_cast_fp16, y = var_1521_cast_fp16)[name = tensor("input_297_cast_fp16")]; tensor key_11_axes_0 = const()[name = tensor("key_11_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_5_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119624000)))]; tensor encoder_layers_5_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_5_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119626112)))]; tensor key_11_cast_fp16 = layer_norm(axes = key_11_axes_0, beta = encoder_layers_5_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_5_norm_self_att_weight_to_fp16, x = input_297_cast_fp16)[name = tensor("key_11_cast_fp16")]; tensor input_299_interleave_0 = const()[name = tensor("input_299_interleave_0"), val = tensor(false)]; tensor input_299_cast_fp16 = concat(axis = var_68, interleave = input_299_interleave_0, values = (cache_21_cast_fp16, key_11_cast_fp16))[name = tensor("input_299_cast_fp16")]; tensor var_1543_begin_0 = const()[name = tensor("op_1543_begin_0"), val = tensor([0, 7, 0])]; tensor var_1543_end_0 = const()[name = tensor("op_1543_end_0"), val = tensor([1, 42, 1024])]; tensor var_1543_end_mask_0 = const()[name = tensor("op_1543_end_mask_0"), val = tensor([true, true, true])]; tensor var_1543_cast_fp16 = slice_by_index(begin = var_1543_begin_0, end = var_1543_end_0, end_mask = var_1543_end_mask_0, x = cache_21_cast_fp16)[name = tensor("op_1543_cast_fp16")]; tensor var_1549_interleave_0 = const()[name = tensor("op_1549_interleave_0"), val = tensor(false)]; tensor var_1549_cast_fp16 = concat(axis = var_68, interleave = var_1549_interleave_0, values = (var_1543_cast_fp16, key_11_cast_fp16))[name = tensor("op_1549_cast_fp16")]; tensor encoder_layers_5_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119628224))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(120414720))), name = tensor("encoder_layers_5_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_5_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(120414912)))]; tensor linear_48_cast_fp16 = linear(bias = encoder_layers_5_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_5_self_attn_linear_q_weight_to_fp16_palettized, x = key_11_cast_fp16)[name = tensor("linear_48_cast_fp16")]; tensor var_1554 = const()[name = tensor("op_1554"), val = tensor([1, -1, 8, 128])]; tensor q_31_cast_fp16 = reshape(shape = var_1554, x = linear_48_cast_fp16)[name = tensor("q_31_cast_fp16")]; tensor encoder_layers_5_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(120417024))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121203520))), name = tensor("encoder_layers_5_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_5_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121203712)))]; tensor linear_49_cast_fp16 = linear(bias = encoder_layers_5_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_5_self_attn_linear_k_weight_to_fp16_palettized, x = input_299_cast_fp16)[name = tensor("linear_49_cast_fp16")]; tensor var_1559 = const()[name = tensor("op_1559"), val = tensor([1, -1, 8, 128])]; tensor k_21_cast_fp16 = reshape(shape = var_1559, x = linear_49_cast_fp16)[name = tensor("k_21_cast_fp16")]; tensor encoder_layers_5_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121205824))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121992320))), name = tensor("encoder_layers_5_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_5_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121992512)))]; tensor linear_50_cast_fp16 = linear(bias = encoder_layers_5_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_5_self_attn_linear_v_weight_to_fp16_palettized, x = input_299_cast_fp16)[name = tensor("linear_50_cast_fp16")]; tensor var_1564 = const()[name = tensor("op_1564"), val = tensor([1, -1, 8, 128])]; tensor v_11_cast_fp16 = reshape(shape = var_1564, x = linear_50_cast_fp16)[name = tensor("v_11_cast_fp16")]; tensor value_19_perm_0 = const()[name = tensor("value_19_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_5_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121994624)))]; tensor var_1577_cast_fp16 = add(x = q_31_cast_fp16, y = encoder_layers_5_self_attn_pos_bias_u_to_fp16)[name = tensor("op_1577_cast_fp16")]; tensor encoder_layers_5_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121996736)))]; tensor var_1579_cast_fp16 = add(x = q_31_cast_fp16, y = encoder_layers_5_self_attn_pos_bias_v_to_fp16)[name = tensor("op_1579_cast_fp16")]; tensor q_with_bias_v_11_perm_0 = const()[name = tensor("q_with_bias_v_11_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_137_transpose_x_0 = const()[name = tensor("x_137_transpose_x_0"), val = tensor(false)]; tensor x_137_transpose_y_0 = const()[name = tensor("x_137_transpose_y_0"), val = tensor(false)]; tensor op_1581_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_1581_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121998848))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122098432))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122098240)))]; tensor q_with_bias_v_11_cast_fp16 = transpose(perm = q_with_bias_v_11_perm_0, x = var_1579_cast_fp16)[name = tensor("transpose_317")]; tensor x_137_cast_fp16 = matmul(transpose_x = x_137_transpose_x_0, transpose_y = x_137_transpose_y_0, x = q_with_bias_v_11_cast_fp16, y = op_1581_to_fp16_quantized)[name = tensor("x_137_cast_fp16")]; tensor x_139_pad_0 = const()[name = tensor("x_139_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_139_mode_0 = const()[name = tensor("x_139_mode_0"), val = tensor("constant")]; tensor const_144_to_fp16 = const()[name = tensor("const_144_to_fp16"), val = tensor(0x0p+0)]; tensor x_139_cast_fp16 = pad(constant_val = const_144_to_fp16, mode = x_139_mode_0, pad = x_139_pad_0, x = x_137_cast_fp16)[name = tensor("x_139_cast_fp16")]; tensor var_1589 = const()[name = tensor("op_1589"), val = tensor([1, 8, -1, 7])]; tensor x_141_cast_fp16 = reshape(shape = var_1589, x = x_139_cast_fp16)[name = tensor("x_141_cast_fp16")]; tensor var_1593_begin_0 = const()[name = tensor("op_1593_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_1593_end_0 = const()[name = tensor("op_1593_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_1593_end_mask_0 = const()[name = tensor("op_1593_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_1593_cast_fp16 = slice_by_index(begin = var_1593_begin_0, end = var_1593_end_0, end_mask = var_1593_end_mask_0, x = x_141_cast_fp16)[name = tensor("op_1593_cast_fp16")]; tensor var_1594 = const()[name = tensor("op_1594"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_21_cast_fp16 = reshape(shape = var_1594, x = var_1593_cast_fp16)[name = tensor("matrix_bd_21_cast_fp16")]; tensor matrix_ac_11_transpose_x_0 = const()[name = tensor("matrix_ac_11_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_11_transpose_y_0 = const()[name = tensor("matrix_ac_11_transpose_y_0"), val = tensor(false)]; tensor transpose_106_perm_0 = const()[name = tensor("transpose_106_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_107_perm_0 = const()[name = tensor("transpose_107_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_107 = transpose(perm = transpose_107_perm_0, x = k_21_cast_fp16)[name = tensor("transpose_315")]; tensor transpose_106 = transpose(perm = transpose_106_perm_0, x = var_1577_cast_fp16)[name = tensor("transpose_316")]; tensor matrix_ac_11_cast_fp16 = matmul(transpose_x = matrix_ac_11_transpose_x_0, transpose_y = matrix_ac_11_transpose_y_0, x = transpose_106, y = transpose_107)[name = tensor("matrix_ac_11_cast_fp16")]; tensor matrix_bd_23_begin_0 = const()[name = tensor("matrix_bd_23_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_23_end_0 = const()[name = tensor("matrix_bd_23_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_23_end_mask_0 = const()[name = tensor("matrix_bd_23_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_23_cast_fp16 = slice_by_index(begin = matrix_bd_23_begin_0, end = matrix_bd_23_end_0, end_mask = matrix_bd_23_end_mask_0, x = matrix_bd_21_cast_fp16)[name = tensor("matrix_bd_23_cast_fp16")]; tensor var_1603_cast_fp16 = add(x = matrix_ac_11_cast_fp16, y = matrix_bd_23_cast_fp16)[name = tensor("op_1603_cast_fp16")]; tensor _inversed_scores_21_y_0_to_fp16 = const()[name = tensor("_inversed_scores_21_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_21_cast_fp16 = mul(x = var_1603_cast_fp16, y = _inversed_scores_21_y_0_to_fp16)[name = tensor("_inversed_scores_21_cast_fp16")]; tensor scores_23_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_21_cast_fp16, cond = mask_11)[name = tensor("scores_23_cast_fp16")]; tensor var_1609_cast_fp16 = softmax(axis = var_59, x = scores_23_cast_fp16)[name = tensor("op_1609_cast_fp16")]; tensor input_301_cast_fp16 = select(a = var_44_to_fp16, b = var_1609_cast_fp16, cond = mask_11)[name = tensor("input_301_cast_fp16")]; tensor x_143_transpose_x_0 = const()[name = tensor("x_143_transpose_x_0"), val = tensor(false)]; tensor x_143_transpose_y_0 = const()[name = tensor("x_143_transpose_y_0"), val = tensor(false)]; tensor value_19_cast_fp16 = transpose(perm = value_19_perm_0, x = v_11_cast_fp16)[name = tensor("transpose_314")]; tensor x_143_cast_fp16 = matmul(transpose_x = x_143_transpose_x_0, transpose_y = x_143_transpose_y_0, x = input_301_cast_fp16, y = value_19_cast_fp16)[name = tensor("x_143_cast_fp16")]; tensor var_1613_perm_0 = const()[name = tensor("op_1613_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1614 = const()[name = tensor("op_1614"), val = tensor([1, -1, 1024])]; tensor var_1613_cast_fp16 = transpose(perm = var_1613_perm_0, x = x_143_cast_fp16)[name = tensor("transpose_313")]; tensor input_303_cast_fp16 = reshape(shape = var_1614, x = var_1613_cast_fp16)[name = tensor("input_303_cast_fp16")]; tensor encoder_layers_5_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122098752))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122885248))), name = tensor("encoder_layers_5_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_5_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122885440)))]; tensor linear_52_cast_fp16 = linear(bias = encoder_layers_5_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_5_self_attn_linear_out_weight_to_fp16_palettized, x = input_303_cast_fp16)[name = tensor("linear_52_cast_fp16")]; tensor input_307_cast_fp16 = add(x = input_297_cast_fp16, y = linear_52_cast_fp16)[name = tensor("input_307_cast_fp16")]; tensor x_147_axes_0 = const()[name = tensor("x_147_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_5_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122887552)))]; tensor encoder_layers_5_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_5_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122889664)))]; tensor x_147_cast_fp16 = layer_norm(axes = x_147_axes_0, beta = encoder_layers_5_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_5_norm_conv_weight_to_fp16, x = input_307_cast_fp16)[name = tensor("x_147_cast_fp16")]; tensor input_309_perm_0 = const()[name = tensor("input_309_perm_0"), val = tensor([0, 2, 1])]; tensor input_311_pad_type_0 = const()[name = tensor("input_311_pad_type_0"), val = tensor("valid")]; tensor input_311_strides_0 = const()[name = tensor("input_311_strides_0"), val = tensor([1])]; tensor input_311_pad_0 = const()[name = tensor("input_311_pad_0"), val = tensor([0, 0])]; tensor input_311_dilations_0 = const()[name = tensor("input_311_dilations_0"), val = tensor([1])]; tensor input_311_groups_0 = const()[name = tensor("input_311_groups_0"), val = tensor(1)]; tensor encoder_layers_5_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_5_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122891776))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124988992))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_309_cast_fp16 = transpose(perm = input_309_perm_0, x = x_147_cast_fp16)[name = tensor("transpose_312")]; tensor input_311_cast_fp16 = conv(dilations = input_311_dilations_0, groups = input_311_groups_0, pad = input_311_pad_0, pad_type = input_311_pad_type_0, strides = input_311_strides_0, weight = encoder_layers_5_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_309_cast_fp16)[name = tensor("input_311_cast_fp16")]; tensor x_149_split_num_splits_0 = const()[name = tensor("x_149_split_num_splits_0"), val = tensor(2)]; tensor x_149_split_axis_0 = const()[name = tensor("x_149_split_axis_0"), val = tensor(1)]; tensor x_149_split_cast_fp16_0, tensor x_149_split_cast_fp16_1 = split(axis = x_149_split_axis_0, num_splits = x_149_split_num_splits_0, x = input_311_cast_fp16)[name = tensor("x_149_split_cast_fp16")]; tensor x_149_split_1_sigmoid_cast_fp16 = sigmoid(x = x_149_split_cast_fp16_1)[name = tensor("x_149_split_1_sigmoid_cast_fp16")]; tensor x_149_cast_fp16 = mul(x = x_149_split_cast_fp16_0, y = x_149_split_1_sigmoid_cast_fp16)[name = tensor("x_149_cast_fp16")]; tensor input_313_cast_fp16 = select(a = var_44_to_fp16, b = x_149_cast_fp16, cond = var_575)[name = tensor("input_313_cast_fp16")]; tensor new_x_23_interleave_0 = const()[name = tensor("new_x_23_interleave_0"), val = tensor(false)]; tensor new_x_23_cast_fp16 = concat(axis = var_59, interleave = new_x_23_interleave_0, values = (cache_23_cast_fp16, input_313_cast_fp16))[name = tensor("new_x_23_cast_fp16")]; tensor var_1653_begin_0 = const()[name = tensor("op_1653_begin_0"), val = tensor([0, 0, 7])]; tensor var_1653_end_0 = const()[name = tensor("op_1653_end_0"), val = tensor([1, 1024, 15])]; tensor var_1653_end_mask_0 = const()[name = tensor("op_1653_end_mask_0"), val = tensor([true, true, true])]; tensor var_1653_cast_fp16 = slice_by_index(begin = var_1653_begin_0, end = var_1653_end_0, end_mask = var_1653_end_mask_0, x = new_x_23_cast_fp16)[name = tensor("op_1653_cast_fp16")]; tensor x_151_pad_type_0 = const()[name = tensor("x_151_pad_type_0"), val = tensor("valid")]; tensor x_151_groups_0 = const()[name = tensor("x_151_groups_0"), val = tensor(1024)]; tensor x_151_strides_0 = const()[name = tensor("x_151_strides_0"), val = tensor([1])]; tensor x_151_pad_0 = const()[name = tensor("x_151_pad_0"), val = tensor([0, 0])]; tensor x_151_dilations_0 = const()[name = tensor("x_151_dilations_0"), val = tensor([1])]; tensor encoder_layers_5_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_5_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124993152))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(125002432))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_151_cast_fp16 = conv(dilations = x_151_dilations_0, groups = x_151_groups_0, pad = x_151_pad_0, pad_type = x_151_pad_type_0, strides = x_151_strides_0, weight = encoder_layers_5_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_23_cast_fp16)[name = tensor("x_151_cast_fp16")]; tensor input_315_perm_0 = const()[name = tensor("input_315_perm_0"), val = tensor([0, 2, 1])]; tensor x_153_axes_0 = const()[name = tensor("x_153_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_5_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(125004544)))]; tensor encoder_layers_5_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_5_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(125006656)))]; tensor input_315_cast_fp16 = transpose(perm = input_315_perm_0, x = x_151_cast_fp16)[name = tensor("transpose_311")]; tensor x_153_cast_fp16 = layer_norm(axes = x_153_axes_0, beta = encoder_layers_5_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_5_conv_batch_norm_weight_to_fp16, x = input_315_cast_fp16)[name = tensor("x_153_cast_fp16")]; tensor input_317_perm_0 = const()[name = tensor("input_317_perm_0"), val = tensor([0, 2, 1])]; tensor input_317_cast_fp16 = transpose(perm = input_317_perm_0, x = x_153_cast_fp16)[name = tensor("transpose_310")]; tensor input_319_cast_fp16 = silu(x = input_317_cast_fp16)[name = tensor("input_319_cast_fp16")]; tensor x_155_pad_type_0 = const()[name = tensor("x_155_pad_type_0"), val = tensor("valid")]; tensor x_155_strides_0 = const()[name = tensor("x_155_strides_0"), val = tensor([1])]; tensor x_155_pad_0 = const()[name = tensor("x_155_pad_0"), val = tensor([0, 0])]; tensor x_155_dilations_0 = const()[name = tensor("x_155_dilations_0"), val = tensor([1])]; tensor x_155_groups_0 = const()[name = tensor("x_155_groups_0"), val = tensor(1)]; tensor encoder_layers_5_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_5_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(125008768))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(126057408))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_155_cast_fp16 = conv(dilations = x_155_dilations_0, groups = x_155_groups_0, pad = x_155_pad_0, pad_type = x_155_pad_type_0, strides = x_155_strides_0, weight = encoder_layers_5_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_319_cast_fp16)[name = tensor("x_155_cast_fp16")]; tensor input_321_perm_0 = const()[name = tensor("input_321_perm_0"), val = tensor([0, 2, 1])]; tensor input_321_cast_fp16 = transpose(perm = input_321_perm_0, x = x_155_cast_fp16)[name = tensor("transpose_309")]; tensor input_323_cast_fp16 = add(x = input_307_cast_fp16, y = input_321_cast_fp16)[name = tensor("input_323_cast_fp16")]; tensor input_325_axes_0 = const()[name = tensor("input_325_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_5_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(126059520)))]; tensor encoder_layers_5_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_5_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(126061632)))]; tensor input_325_cast_fp16 = layer_norm(axes = input_325_axes_0, beta = encoder_layers_5_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_5_norm_feed_forward2_weight_to_fp16, x = input_323_cast_fp16)[name = tensor("input_325_cast_fp16")]; tensor encoder_layers_5_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(126063744))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(129209536))), name = tensor("encoder_layers_5_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_5_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_5_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(129209728)))]; tensor linear_53_cast_fp16 = linear(bias = encoder_layers_5_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_5_feed_forward2_linear1_weight_to_fp16_palettized, x = input_325_cast_fp16)[name = tensor("linear_53_cast_fp16")]; tensor input_329_cast_fp16 = silu(x = linear_53_cast_fp16)[name = tensor("input_329_cast_fp16")]; tensor encoder_layers_5_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(129217984))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132363776))), name = tensor("encoder_layers_5_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_5_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_5_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132363968)))]; tensor linear_54_cast_fp16 = linear(bias = encoder_layers_5_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_5_feed_forward2_linear2_weight_to_fp16_palettized, x = input_329_cast_fp16)[name = tensor("linear_54_cast_fp16")]; tensor var_1696_to_fp16 = const()[name = tensor("op_1696_to_fp16"), val = tensor(0x1p-1)]; tensor var_1697_cast_fp16 = mul(x = linear_54_cast_fp16, y = var_1696_to_fp16)[name = tensor("op_1697_cast_fp16")]; tensor input_335_cast_fp16 = add(x = input_323_cast_fp16, y = var_1697_cast_fp16)[name = tensor("input_335_cast_fp16")]; tensor input_337_axes_0 = const()[name = tensor("input_337_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_5_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132366080)))]; tensor encoder_layers_5_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_5_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132368192)))]; tensor input_337_cast_fp16 = layer_norm(axes = input_337_axes_0, beta = encoder_layers_5_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_5_norm_out_weight_to_fp16, x = input_335_cast_fp16)[name = tensor("input_337_cast_fp16")]; tensor cache_25_begin_0 = const()[name = tensor("cache_25_begin_0"), val = tensor([6, 0, 0, 0])]; tensor cache_25_end_0 = const()[name = tensor("cache_25_end_0"), val = tensor([7, 1, 42, 1024])]; tensor cache_25_end_mask_0 = const()[name = tensor("cache_25_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_25_squeeze_mask_0 = const()[name = tensor("cache_25_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_25_cast_fp16 = slice_by_index(begin = cache_25_begin_0, end = cache_25_end_0, end_mask = cache_25_end_mask_0, squeeze_mask = cache_25_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_25_cast_fp16")]; tensor cache_27_begin_0 = const()[name = tensor("cache_27_begin_0"), val = tensor([6, 0, 0, 0])]; tensor cache_27_end_0 = const()[name = tensor("cache_27_end_0"), val = tensor([7, 1, 1024, 8])]; tensor cache_27_end_mask_0 = const()[name = tensor("cache_27_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_27_squeeze_mask_0 = const()[name = tensor("cache_27_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_27_cast_fp16 = slice_by_index(begin = cache_27_begin_0, end = cache_27_end_0, end_mask = cache_27_end_mask_0, squeeze_mask = cache_27_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_27_cast_fp16")]; tensor input_339_axes_0 = const()[name = tensor("input_339_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_6_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132370304)))]; tensor encoder_layers_6_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_6_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132372416)))]; tensor input_339_cast_fp16 = layer_norm(axes = input_339_axes_0, beta = encoder_layers_6_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_6_norm_feed_forward1_weight_to_fp16, x = input_337_cast_fp16)[name = tensor("input_339_cast_fp16")]; tensor encoder_layers_6_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132374528))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135520320))), name = tensor("encoder_layers_6_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_6_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_6_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135520512)))]; tensor linear_55_cast_fp16 = linear(bias = encoder_layers_6_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_6_feed_forward1_linear1_weight_to_fp16_palettized, x = input_339_cast_fp16)[name = tensor("linear_55_cast_fp16")]; tensor input_343_cast_fp16 = silu(x = linear_55_cast_fp16)[name = tensor("input_343_cast_fp16")]; tensor encoder_layers_6_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135528768))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(138674560))), name = tensor("encoder_layers_6_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_6_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_6_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(138674752)))]; tensor linear_56_cast_fp16 = linear(bias = encoder_layers_6_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_6_feed_forward1_linear2_weight_to_fp16_palettized, x = input_343_cast_fp16)[name = tensor("linear_56_cast_fp16")]; tensor var_1733_to_fp16 = const()[name = tensor("op_1733_to_fp16"), val = tensor(0x1p-1)]; tensor var_1734_cast_fp16 = mul(x = linear_56_cast_fp16, y = var_1733_to_fp16)[name = tensor("op_1734_cast_fp16")]; tensor input_349_cast_fp16 = add(x = input_337_cast_fp16, y = var_1734_cast_fp16)[name = tensor("input_349_cast_fp16")]; tensor key_13_axes_0 = const()[name = tensor("key_13_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_6_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(138676864)))]; tensor encoder_layers_6_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_6_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(138678976)))]; tensor key_13_cast_fp16 = layer_norm(axes = key_13_axes_0, beta = encoder_layers_6_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_6_norm_self_att_weight_to_fp16, x = input_349_cast_fp16)[name = tensor("key_13_cast_fp16")]; tensor input_351_interleave_0 = const()[name = tensor("input_351_interleave_0"), val = tensor(false)]; tensor input_351_cast_fp16 = concat(axis = var_68, interleave = input_351_interleave_0, values = (cache_25_cast_fp16, key_13_cast_fp16))[name = tensor("input_351_cast_fp16")]; tensor var_1756_begin_0 = const()[name = tensor("op_1756_begin_0"), val = tensor([0, 7, 0])]; tensor var_1756_end_0 = const()[name = tensor("op_1756_end_0"), val = tensor([1, 42, 1024])]; tensor var_1756_end_mask_0 = const()[name = tensor("op_1756_end_mask_0"), val = tensor([true, true, true])]; tensor var_1756_cast_fp16 = slice_by_index(begin = var_1756_begin_0, end = var_1756_end_0, end_mask = var_1756_end_mask_0, x = cache_25_cast_fp16)[name = tensor("op_1756_cast_fp16")]; tensor var_1762_interleave_0 = const()[name = tensor("op_1762_interleave_0"), val = tensor(false)]; tensor var_1762_cast_fp16 = concat(axis = var_68, interleave = var_1762_interleave_0, values = (var_1756_cast_fp16, key_13_cast_fp16))[name = tensor("op_1762_cast_fp16")]; tensor encoder_layers_6_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(138681088))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139467584))), name = tensor("encoder_layers_6_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_6_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139467776)))]; tensor linear_57_cast_fp16 = linear(bias = encoder_layers_6_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_6_self_attn_linear_q_weight_to_fp16_palettized, x = key_13_cast_fp16)[name = tensor("linear_57_cast_fp16")]; tensor var_1767 = const()[name = tensor("op_1767"), val = tensor([1, -1, 8, 128])]; tensor q_37_cast_fp16 = reshape(shape = var_1767, x = linear_57_cast_fp16)[name = tensor("q_37_cast_fp16")]; tensor encoder_layers_6_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139469888))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140256384))), name = tensor("encoder_layers_6_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_6_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140256576)))]; tensor linear_58_cast_fp16 = linear(bias = encoder_layers_6_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_6_self_attn_linear_k_weight_to_fp16_palettized, x = input_351_cast_fp16)[name = tensor("linear_58_cast_fp16")]; tensor var_1772 = const()[name = tensor("op_1772"), val = tensor([1, -1, 8, 128])]; tensor k_25_cast_fp16 = reshape(shape = var_1772, x = linear_58_cast_fp16)[name = tensor("k_25_cast_fp16")]; tensor encoder_layers_6_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140258688))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141045184))), name = tensor("encoder_layers_6_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_6_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141045376)))]; tensor linear_59_cast_fp16 = linear(bias = encoder_layers_6_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_6_self_attn_linear_v_weight_to_fp16_palettized, x = input_351_cast_fp16)[name = tensor("linear_59_cast_fp16")]; tensor var_1777 = const()[name = tensor("op_1777"), val = tensor([1, -1, 8, 128])]; tensor v_13_cast_fp16 = reshape(shape = var_1777, x = linear_59_cast_fp16)[name = tensor("v_13_cast_fp16")]; tensor value_21_perm_0 = const()[name = tensor("value_21_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_6_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141047488)))]; tensor var_1790_cast_fp16 = add(x = q_37_cast_fp16, y = encoder_layers_6_self_attn_pos_bias_u_to_fp16)[name = tensor("op_1790_cast_fp16")]; tensor encoder_layers_6_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141049600)))]; tensor var_1792_cast_fp16 = add(x = q_37_cast_fp16, y = encoder_layers_6_self_attn_pos_bias_v_to_fp16)[name = tensor("op_1792_cast_fp16")]; tensor q_with_bias_v_13_perm_0 = const()[name = tensor("q_with_bias_v_13_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_163_transpose_x_0 = const()[name = tensor("x_163_transpose_x_0"), val = tensor(false)]; tensor x_163_transpose_y_0 = const()[name = tensor("x_163_transpose_y_0"), val = tensor(false)]; tensor op_1794_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_1794_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141051712))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141151296))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141151104)))]; tensor q_with_bias_v_13_cast_fp16 = transpose(perm = q_with_bias_v_13_perm_0, x = var_1792_cast_fp16)[name = tensor("transpose_308")]; tensor x_163_cast_fp16 = matmul(transpose_x = x_163_transpose_x_0, transpose_y = x_163_transpose_y_0, x = q_with_bias_v_13_cast_fp16, y = op_1794_to_fp16_quantized)[name = tensor("x_163_cast_fp16")]; tensor x_165_pad_0 = const()[name = tensor("x_165_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_165_mode_0 = const()[name = tensor("x_165_mode_0"), val = tensor("constant")]; tensor const_157_to_fp16 = const()[name = tensor("const_157_to_fp16"), val = tensor(0x0p+0)]; tensor x_165_cast_fp16 = pad(constant_val = const_157_to_fp16, mode = x_165_mode_0, pad = x_165_pad_0, x = x_163_cast_fp16)[name = tensor("x_165_cast_fp16")]; tensor var_1802 = const()[name = tensor("op_1802"), val = tensor([1, 8, -1, 7])]; tensor x_167_cast_fp16 = reshape(shape = var_1802, x = x_165_cast_fp16)[name = tensor("x_167_cast_fp16")]; tensor var_1806_begin_0 = const()[name = tensor("op_1806_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_1806_end_0 = const()[name = tensor("op_1806_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_1806_end_mask_0 = const()[name = tensor("op_1806_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_1806_cast_fp16 = slice_by_index(begin = var_1806_begin_0, end = var_1806_end_0, end_mask = var_1806_end_mask_0, x = x_167_cast_fp16)[name = tensor("op_1806_cast_fp16")]; tensor var_1807 = const()[name = tensor("op_1807"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_25_cast_fp16 = reshape(shape = var_1807, x = var_1806_cast_fp16)[name = tensor("matrix_bd_25_cast_fp16")]; tensor matrix_ac_13_transpose_x_0 = const()[name = tensor("matrix_ac_13_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_13_transpose_y_0 = const()[name = tensor("matrix_ac_13_transpose_y_0"), val = tensor(false)]; tensor transpose_108_perm_0 = const()[name = tensor("transpose_108_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_109_perm_0 = const()[name = tensor("transpose_109_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_109 = transpose(perm = transpose_109_perm_0, x = k_25_cast_fp16)[name = tensor("transpose_306")]; tensor transpose_108 = transpose(perm = transpose_108_perm_0, x = var_1790_cast_fp16)[name = tensor("transpose_307")]; tensor matrix_ac_13_cast_fp16 = matmul(transpose_x = matrix_ac_13_transpose_x_0, transpose_y = matrix_ac_13_transpose_y_0, x = transpose_108, y = transpose_109)[name = tensor("matrix_ac_13_cast_fp16")]; tensor matrix_bd_27_begin_0 = const()[name = tensor("matrix_bd_27_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_27_end_0 = const()[name = tensor("matrix_bd_27_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_27_end_mask_0 = const()[name = tensor("matrix_bd_27_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_27_cast_fp16 = slice_by_index(begin = matrix_bd_27_begin_0, end = matrix_bd_27_end_0, end_mask = matrix_bd_27_end_mask_0, x = matrix_bd_25_cast_fp16)[name = tensor("matrix_bd_27_cast_fp16")]; tensor var_1816_cast_fp16 = add(x = matrix_ac_13_cast_fp16, y = matrix_bd_27_cast_fp16)[name = tensor("op_1816_cast_fp16")]; tensor _inversed_scores_25_y_0_to_fp16 = const()[name = tensor("_inversed_scores_25_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_25_cast_fp16 = mul(x = var_1816_cast_fp16, y = _inversed_scores_25_y_0_to_fp16)[name = tensor("_inversed_scores_25_cast_fp16")]; tensor scores_27_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_25_cast_fp16, cond = mask_11)[name = tensor("scores_27_cast_fp16")]; tensor var_1822_cast_fp16 = softmax(axis = var_59, x = scores_27_cast_fp16)[name = tensor("op_1822_cast_fp16")]; tensor input_353_cast_fp16 = select(a = var_44_to_fp16, b = var_1822_cast_fp16, cond = mask_11)[name = tensor("input_353_cast_fp16")]; tensor x_169_transpose_x_0 = const()[name = tensor("x_169_transpose_x_0"), val = tensor(false)]; tensor x_169_transpose_y_0 = const()[name = tensor("x_169_transpose_y_0"), val = tensor(false)]; tensor value_21_cast_fp16 = transpose(perm = value_21_perm_0, x = v_13_cast_fp16)[name = tensor("transpose_305")]; tensor x_169_cast_fp16 = matmul(transpose_x = x_169_transpose_x_0, transpose_y = x_169_transpose_y_0, x = input_353_cast_fp16, y = value_21_cast_fp16)[name = tensor("x_169_cast_fp16")]; tensor var_1826_perm_0 = const()[name = tensor("op_1826_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1827 = const()[name = tensor("op_1827"), val = tensor([1, -1, 1024])]; tensor var_1826_cast_fp16 = transpose(perm = var_1826_perm_0, x = x_169_cast_fp16)[name = tensor("transpose_304")]; tensor input_355_cast_fp16 = reshape(shape = var_1827, x = var_1826_cast_fp16)[name = tensor("input_355_cast_fp16")]; tensor encoder_layers_6_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141151616))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141938112))), name = tensor("encoder_layers_6_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_6_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141938304)))]; tensor linear_61_cast_fp16 = linear(bias = encoder_layers_6_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_6_self_attn_linear_out_weight_to_fp16_palettized, x = input_355_cast_fp16)[name = tensor("linear_61_cast_fp16")]; tensor input_359_cast_fp16 = add(x = input_349_cast_fp16, y = linear_61_cast_fp16)[name = tensor("input_359_cast_fp16")]; tensor x_173_axes_0 = const()[name = tensor("x_173_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_6_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141940416)))]; tensor encoder_layers_6_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_6_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141942528)))]; tensor x_173_cast_fp16 = layer_norm(axes = x_173_axes_0, beta = encoder_layers_6_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_6_norm_conv_weight_to_fp16, x = input_359_cast_fp16)[name = tensor("x_173_cast_fp16")]; tensor input_361_perm_0 = const()[name = tensor("input_361_perm_0"), val = tensor([0, 2, 1])]; tensor input_363_pad_type_0 = const()[name = tensor("input_363_pad_type_0"), val = tensor("valid")]; tensor input_363_strides_0 = const()[name = tensor("input_363_strides_0"), val = tensor([1])]; tensor input_363_pad_0 = const()[name = tensor("input_363_pad_0"), val = tensor([0, 0])]; tensor input_363_dilations_0 = const()[name = tensor("input_363_dilations_0"), val = tensor([1])]; tensor input_363_groups_0 = const()[name = tensor("input_363_groups_0"), val = tensor(1)]; tensor encoder_layers_6_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_6_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141944640))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144041856))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_361_cast_fp16 = transpose(perm = input_361_perm_0, x = x_173_cast_fp16)[name = tensor("transpose_303")]; tensor input_363_cast_fp16 = conv(dilations = input_363_dilations_0, groups = input_363_groups_0, pad = input_363_pad_0, pad_type = input_363_pad_type_0, strides = input_363_strides_0, weight = encoder_layers_6_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_361_cast_fp16)[name = tensor("input_363_cast_fp16")]; tensor x_175_split_num_splits_0 = const()[name = tensor("x_175_split_num_splits_0"), val = tensor(2)]; tensor x_175_split_axis_0 = const()[name = tensor("x_175_split_axis_0"), val = tensor(1)]; tensor x_175_split_cast_fp16_0, tensor x_175_split_cast_fp16_1 = split(axis = x_175_split_axis_0, num_splits = x_175_split_num_splits_0, x = input_363_cast_fp16)[name = tensor("x_175_split_cast_fp16")]; tensor x_175_split_1_sigmoid_cast_fp16 = sigmoid(x = x_175_split_cast_fp16_1)[name = tensor("x_175_split_1_sigmoid_cast_fp16")]; tensor x_175_cast_fp16 = mul(x = x_175_split_cast_fp16_0, y = x_175_split_1_sigmoid_cast_fp16)[name = tensor("x_175_cast_fp16")]; tensor input_365_cast_fp16 = select(a = var_44_to_fp16, b = x_175_cast_fp16, cond = var_575)[name = tensor("input_365_cast_fp16")]; tensor new_x_27_interleave_0 = const()[name = tensor("new_x_27_interleave_0"), val = tensor(false)]; tensor new_x_27_cast_fp16 = concat(axis = var_59, interleave = new_x_27_interleave_0, values = (cache_27_cast_fp16, input_365_cast_fp16))[name = tensor("new_x_27_cast_fp16")]; tensor var_1866_begin_0 = const()[name = tensor("op_1866_begin_0"), val = tensor([0, 0, 7])]; tensor var_1866_end_0 = const()[name = tensor("op_1866_end_0"), val = tensor([1, 1024, 15])]; tensor var_1866_end_mask_0 = const()[name = tensor("op_1866_end_mask_0"), val = tensor([true, true, true])]; tensor var_1866_cast_fp16 = slice_by_index(begin = var_1866_begin_0, end = var_1866_end_0, end_mask = var_1866_end_mask_0, x = new_x_27_cast_fp16)[name = tensor("op_1866_cast_fp16")]; tensor x_177_pad_type_0 = const()[name = tensor("x_177_pad_type_0"), val = tensor("valid")]; tensor x_177_groups_0 = const()[name = tensor("x_177_groups_0"), val = tensor(1024)]; tensor x_177_strides_0 = const()[name = tensor("x_177_strides_0"), val = tensor([1])]; tensor x_177_pad_0 = const()[name = tensor("x_177_pad_0"), val = tensor([0, 0])]; tensor x_177_dilations_0 = const()[name = tensor("x_177_dilations_0"), val = tensor([1])]; tensor encoder_layers_6_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_6_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144046016))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144055296))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_177_cast_fp16 = conv(dilations = x_177_dilations_0, groups = x_177_groups_0, pad = x_177_pad_0, pad_type = x_177_pad_type_0, strides = x_177_strides_0, weight = encoder_layers_6_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_27_cast_fp16)[name = tensor("x_177_cast_fp16")]; tensor input_367_perm_0 = const()[name = tensor("input_367_perm_0"), val = tensor([0, 2, 1])]; tensor x_179_axes_0 = const()[name = tensor("x_179_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_6_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144057408)))]; tensor encoder_layers_6_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_6_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144059520)))]; tensor input_367_cast_fp16 = transpose(perm = input_367_perm_0, x = x_177_cast_fp16)[name = tensor("transpose_302")]; tensor x_179_cast_fp16 = layer_norm(axes = x_179_axes_0, beta = encoder_layers_6_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_6_conv_batch_norm_weight_to_fp16, x = input_367_cast_fp16)[name = tensor("x_179_cast_fp16")]; tensor input_369_perm_0 = const()[name = tensor("input_369_perm_0"), val = tensor([0, 2, 1])]; tensor input_369_cast_fp16 = transpose(perm = input_369_perm_0, x = x_179_cast_fp16)[name = tensor("transpose_301")]; tensor input_371_cast_fp16 = silu(x = input_369_cast_fp16)[name = tensor("input_371_cast_fp16")]; tensor x_181_pad_type_0 = const()[name = tensor("x_181_pad_type_0"), val = tensor("valid")]; tensor x_181_strides_0 = const()[name = tensor("x_181_strides_0"), val = tensor([1])]; tensor x_181_pad_0 = const()[name = tensor("x_181_pad_0"), val = tensor([0, 0])]; tensor x_181_dilations_0 = const()[name = tensor("x_181_dilations_0"), val = tensor([1])]; tensor x_181_groups_0 = const()[name = tensor("x_181_groups_0"), val = tensor(1)]; tensor encoder_layers_6_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_6_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144061632))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145110272))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_181_cast_fp16 = conv(dilations = x_181_dilations_0, groups = x_181_groups_0, pad = x_181_pad_0, pad_type = x_181_pad_type_0, strides = x_181_strides_0, weight = encoder_layers_6_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_371_cast_fp16)[name = tensor("x_181_cast_fp16")]; tensor input_373_perm_0 = const()[name = tensor("input_373_perm_0"), val = tensor([0, 2, 1])]; tensor input_373_cast_fp16 = transpose(perm = input_373_perm_0, x = x_181_cast_fp16)[name = tensor("transpose_300")]; tensor input_375_cast_fp16 = add(x = input_359_cast_fp16, y = input_373_cast_fp16)[name = tensor("input_375_cast_fp16")]; tensor input_377_axes_0 = const()[name = tensor("input_377_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_6_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145112384)))]; tensor encoder_layers_6_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_6_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145114496)))]; tensor input_377_cast_fp16 = layer_norm(axes = input_377_axes_0, beta = encoder_layers_6_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_6_norm_feed_forward2_weight_to_fp16, x = input_375_cast_fp16)[name = tensor("input_377_cast_fp16")]; tensor encoder_layers_6_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145116608))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148262400))), name = tensor("encoder_layers_6_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_6_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_6_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148262592)))]; tensor linear_62_cast_fp16 = linear(bias = encoder_layers_6_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_6_feed_forward2_linear1_weight_to_fp16_palettized, x = input_377_cast_fp16)[name = tensor("linear_62_cast_fp16")]; tensor input_381_cast_fp16 = silu(x = linear_62_cast_fp16)[name = tensor("input_381_cast_fp16")]; tensor encoder_layers_6_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148270848))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151416640))), name = tensor("encoder_layers_6_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_6_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_6_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151416832)))]; tensor linear_63_cast_fp16 = linear(bias = encoder_layers_6_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_6_feed_forward2_linear2_weight_to_fp16_palettized, x = input_381_cast_fp16)[name = tensor("linear_63_cast_fp16")]; tensor var_1909_to_fp16 = const()[name = tensor("op_1909_to_fp16"), val = tensor(0x1p-1)]; tensor var_1910_cast_fp16 = mul(x = linear_63_cast_fp16, y = var_1909_to_fp16)[name = tensor("op_1910_cast_fp16")]; tensor input_387_cast_fp16 = add(x = input_375_cast_fp16, y = var_1910_cast_fp16)[name = tensor("input_387_cast_fp16")]; tensor input_389_axes_0 = const()[name = tensor("input_389_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_6_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151418944)))]; tensor encoder_layers_6_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_6_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151421056)))]; tensor input_389_cast_fp16 = layer_norm(axes = input_389_axes_0, beta = encoder_layers_6_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_6_norm_out_weight_to_fp16, x = input_387_cast_fp16)[name = tensor("input_389_cast_fp16")]; tensor cache_29_begin_0 = const()[name = tensor("cache_29_begin_0"), val = tensor([7, 0, 0, 0])]; tensor cache_29_end_0 = const()[name = tensor("cache_29_end_0"), val = tensor([8, 1, 42, 1024])]; tensor cache_29_end_mask_0 = const()[name = tensor("cache_29_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_29_squeeze_mask_0 = const()[name = tensor("cache_29_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_29_cast_fp16 = slice_by_index(begin = cache_29_begin_0, end = cache_29_end_0, end_mask = cache_29_end_mask_0, squeeze_mask = cache_29_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_29_cast_fp16")]; tensor cache_31_begin_0 = const()[name = tensor("cache_31_begin_0"), val = tensor([7, 0, 0, 0])]; tensor cache_31_end_0 = const()[name = tensor("cache_31_end_0"), val = tensor([8, 1, 1024, 8])]; tensor cache_31_end_mask_0 = const()[name = tensor("cache_31_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_31_squeeze_mask_0 = const()[name = tensor("cache_31_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_31_cast_fp16 = slice_by_index(begin = cache_31_begin_0, end = cache_31_end_0, end_mask = cache_31_end_mask_0, squeeze_mask = cache_31_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_31_cast_fp16")]; tensor input_391_axes_0 = const()[name = tensor("input_391_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_7_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151423168)))]; tensor encoder_layers_7_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_7_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151425280)))]; tensor input_391_cast_fp16 = layer_norm(axes = input_391_axes_0, beta = encoder_layers_7_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_7_norm_feed_forward1_weight_to_fp16, x = input_389_cast_fp16)[name = tensor("input_391_cast_fp16")]; tensor encoder_layers_7_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151427392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154573184))), name = tensor("encoder_layers_7_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_7_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_7_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154573376)))]; tensor linear_64_cast_fp16 = linear(bias = encoder_layers_7_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_7_feed_forward1_linear1_weight_to_fp16_palettized, x = input_391_cast_fp16)[name = tensor("linear_64_cast_fp16")]; tensor input_395_cast_fp16 = silu(x = linear_64_cast_fp16)[name = tensor("input_395_cast_fp16")]; tensor encoder_layers_7_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154581632))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157727424))), name = tensor("encoder_layers_7_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_7_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_7_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157727616)))]; tensor linear_65_cast_fp16 = linear(bias = encoder_layers_7_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_7_feed_forward1_linear2_weight_to_fp16_palettized, x = input_395_cast_fp16)[name = tensor("linear_65_cast_fp16")]; tensor var_1946_to_fp16 = const()[name = tensor("op_1946_to_fp16"), val = tensor(0x1p-1)]; tensor var_1947_cast_fp16 = mul(x = linear_65_cast_fp16, y = var_1946_to_fp16)[name = tensor("op_1947_cast_fp16")]; tensor input_401_cast_fp16 = add(x = input_389_cast_fp16, y = var_1947_cast_fp16)[name = tensor("input_401_cast_fp16")]; tensor key_15_axes_0 = const()[name = tensor("key_15_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_7_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157729728)))]; tensor encoder_layers_7_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_7_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157731840)))]; tensor key_15_cast_fp16 = layer_norm(axes = key_15_axes_0, beta = encoder_layers_7_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_7_norm_self_att_weight_to_fp16, x = input_401_cast_fp16)[name = tensor("key_15_cast_fp16")]; tensor input_403_interleave_0 = const()[name = tensor("input_403_interleave_0"), val = tensor(false)]; tensor input_403_cast_fp16 = concat(axis = var_68, interleave = input_403_interleave_0, values = (cache_29_cast_fp16, key_15_cast_fp16))[name = tensor("input_403_cast_fp16")]; tensor var_1969_begin_0 = const()[name = tensor("op_1969_begin_0"), val = tensor([0, 7, 0])]; tensor var_1969_end_0 = const()[name = tensor("op_1969_end_0"), val = tensor([1, 42, 1024])]; tensor var_1969_end_mask_0 = const()[name = tensor("op_1969_end_mask_0"), val = tensor([true, true, true])]; tensor var_1969_cast_fp16 = slice_by_index(begin = var_1969_begin_0, end = var_1969_end_0, end_mask = var_1969_end_mask_0, x = cache_29_cast_fp16)[name = tensor("op_1969_cast_fp16")]; tensor var_1975_interleave_0 = const()[name = tensor("op_1975_interleave_0"), val = tensor(false)]; tensor var_1975_cast_fp16 = concat(axis = var_68, interleave = var_1975_interleave_0, values = (var_1969_cast_fp16, key_15_cast_fp16))[name = tensor("op_1975_cast_fp16")]; tensor encoder_layers_7_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157733952))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158520448))), name = tensor("encoder_layers_7_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_7_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158520640)))]; tensor linear_66_cast_fp16 = linear(bias = encoder_layers_7_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_7_self_attn_linear_q_weight_to_fp16_palettized, x = key_15_cast_fp16)[name = tensor("linear_66_cast_fp16")]; tensor var_1980 = const()[name = tensor("op_1980"), val = tensor([1, -1, 8, 128])]; tensor q_43_cast_fp16 = reshape(shape = var_1980, x = linear_66_cast_fp16)[name = tensor("q_43_cast_fp16")]; tensor encoder_layers_7_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158522752))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159309248))), name = tensor("encoder_layers_7_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_7_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159309440)))]; tensor linear_67_cast_fp16 = linear(bias = encoder_layers_7_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_7_self_attn_linear_k_weight_to_fp16_palettized, x = input_403_cast_fp16)[name = tensor("linear_67_cast_fp16")]; tensor var_1985 = const()[name = tensor("op_1985"), val = tensor([1, -1, 8, 128])]; tensor k_29_cast_fp16 = reshape(shape = var_1985, x = linear_67_cast_fp16)[name = tensor("k_29_cast_fp16")]; tensor encoder_layers_7_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159311552))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160098048))), name = tensor("encoder_layers_7_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_7_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160098240)))]; tensor linear_68_cast_fp16 = linear(bias = encoder_layers_7_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_7_self_attn_linear_v_weight_to_fp16_palettized, x = input_403_cast_fp16)[name = tensor("linear_68_cast_fp16")]; tensor var_1990 = const()[name = tensor("op_1990"), val = tensor([1, -1, 8, 128])]; tensor v_15_cast_fp16 = reshape(shape = var_1990, x = linear_68_cast_fp16)[name = tensor("v_15_cast_fp16")]; tensor value_23_perm_0 = const()[name = tensor("value_23_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_7_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160100352)))]; tensor var_2003_cast_fp16 = add(x = q_43_cast_fp16, y = encoder_layers_7_self_attn_pos_bias_u_to_fp16)[name = tensor("op_2003_cast_fp16")]; tensor encoder_layers_7_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160102464)))]; tensor var_2005_cast_fp16 = add(x = q_43_cast_fp16, y = encoder_layers_7_self_attn_pos_bias_v_to_fp16)[name = tensor("op_2005_cast_fp16")]; tensor q_with_bias_v_15_perm_0 = const()[name = tensor("q_with_bias_v_15_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_189_transpose_x_0 = const()[name = tensor("x_189_transpose_x_0"), val = tensor(false)]; tensor x_189_transpose_y_0 = const()[name = tensor("x_189_transpose_y_0"), val = tensor(false)]; tensor op_2007_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_2007_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160104576))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160204160))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160203968)))]; tensor q_with_bias_v_15_cast_fp16 = transpose(perm = q_with_bias_v_15_perm_0, x = var_2005_cast_fp16)[name = tensor("transpose_299")]; tensor x_189_cast_fp16 = matmul(transpose_x = x_189_transpose_x_0, transpose_y = x_189_transpose_y_0, x = q_with_bias_v_15_cast_fp16, y = op_2007_to_fp16_quantized)[name = tensor("x_189_cast_fp16")]; tensor x_191_pad_0 = const()[name = tensor("x_191_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_191_mode_0 = const()[name = tensor("x_191_mode_0"), val = tensor("constant")]; tensor const_170_to_fp16 = const()[name = tensor("const_170_to_fp16"), val = tensor(0x0p+0)]; tensor x_191_cast_fp16 = pad(constant_val = const_170_to_fp16, mode = x_191_mode_0, pad = x_191_pad_0, x = x_189_cast_fp16)[name = tensor("x_191_cast_fp16")]; tensor var_2015 = const()[name = tensor("op_2015"), val = tensor([1, 8, -1, 7])]; tensor x_193_cast_fp16 = reshape(shape = var_2015, x = x_191_cast_fp16)[name = tensor("x_193_cast_fp16")]; tensor var_2019_begin_0 = const()[name = tensor("op_2019_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_2019_end_0 = const()[name = tensor("op_2019_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_2019_end_mask_0 = const()[name = tensor("op_2019_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_2019_cast_fp16 = slice_by_index(begin = var_2019_begin_0, end = var_2019_end_0, end_mask = var_2019_end_mask_0, x = x_193_cast_fp16)[name = tensor("op_2019_cast_fp16")]; tensor var_2020 = const()[name = tensor("op_2020"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_29_cast_fp16 = reshape(shape = var_2020, x = var_2019_cast_fp16)[name = tensor("matrix_bd_29_cast_fp16")]; tensor matrix_ac_15_transpose_x_0 = const()[name = tensor("matrix_ac_15_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_15_transpose_y_0 = const()[name = tensor("matrix_ac_15_transpose_y_0"), val = tensor(false)]; tensor transpose_110_perm_0 = const()[name = tensor("transpose_110_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_111_perm_0 = const()[name = tensor("transpose_111_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_111 = transpose(perm = transpose_111_perm_0, x = k_29_cast_fp16)[name = tensor("transpose_297")]; tensor transpose_110 = transpose(perm = transpose_110_perm_0, x = var_2003_cast_fp16)[name = tensor("transpose_298")]; tensor matrix_ac_15_cast_fp16 = matmul(transpose_x = matrix_ac_15_transpose_x_0, transpose_y = matrix_ac_15_transpose_y_0, x = transpose_110, y = transpose_111)[name = tensor("matrix_ac_15_cast_fp16")]; tensor matrix_bd_31_begin_0 = const()[name = tensor("matrix_bd_31_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_31_end_0 = const()[name = tensor("matrix_bd_31_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_31_end_mask_0 = const()[name = tensor("matrix_bd_31_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_31_cast_fp16 = slice_by_index(begin = matrix_bd_31_begin_0, end = matrix_bd_31_end_0, end_mask = matrix_bd_31_end_mask_0, x = matrix_bd_29_cast_fp16)[name = tensor("matrix_bd_31_cast_fp16")]; tensor var_2029_cast_fp16 = add(x = matrix_ac_15_cast_fp16, y = matrix_bd_31_cast_fp16)[name = tensor("op_2029_cast_fp16")]; tensor _inversed_scores_29_y_0_to_fp16 = const()[name = tensor("_inversed_scores_29_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_29_cast_fp16 = mul(x = var_2029_cast_fp16, y = _inversed_scores_29_y_0_to_fp16)[name = tensor("_inversed_scores_29_cast_fp16")]; tensor scores_31_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_29_cast_fp16, cond = mask_11)[name = tensor("scores_31_cast_fp16")]; tensor var_2035_cast_fp16 = softmax(axis = var_59, x = scores_31_cast_fp16)[name = tensor("op_2035_cast_fp16")]; tensor input_405_cast_fp16 = select(a = var_44_to_fp16, b = var_2035_cast_fp16, cond = mask_11)[name = tensor("input_405_cast_fp16")]; tensor x_195_transpose_x_0 = const()[name = tensor("x_195_transpose_x_0"), val = tensor(false)]; tensor x_195_transpose_y_0 = const()[name = tensor("x_195_transpose_y_0"), val = tensor(false)]; tensor value_23_cast_fp16 = transpose(perm = value_23_perm_0, x = v_15_cast_fp16)[name = tensor("transpose_296")]; tensor x_195_cast_fp16 = matmul(transpose_x = x_195_transpose_x_0, transpose_y = x_195_transpose_y_0, x = input_405_cast_fp16, y = value_23_cast_fp16)[name = tensor("x_195_cast_fp16")]; tensor var_2039_perm_0 = const()[name = tensor("op_2039_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2040 = const()[name = tensor("op_2040"), val = tensor([1, -1, 1024])]; tensor var_2039_cast_fp16 = transpose(perm = var_2039_perm_0, x = x_195_cast_fp16)[name = tensor("transpose_295")]; tensor input_407_cast_fp16 = reshape(shape = var_2040, x = var_2039_cast_fp16)[name = tensor("input_407_cast_fp16")]; tensor encoder_layers_7_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160204480))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160990976))), name = tensor("encoder_layers_7_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_7_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160991168)))]; tensor linear_70_cast_fp16 = linear(bias = encoder_layers_7_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_7_self_attn_linear_out_weight_to_fp16_palettized, x = input_407_cast_fp16)[name = tensor("linear_70_cast_fp16")]; tensor input_411_cast_fp16 = add(x = input_401_cast_fp16, y = linear_70_cast_fp16)[name = tensor("input_411_cast_fp16")]; tensor x_199_axes_0 = const()[name = tensor("x_199_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_7_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160993280)))]; tensor encoder_layers_7_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_7_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160995392)))]; tensor x_199_cast_fp16 = layer_norm(axes = x_199_axes_0, beta = encoder_layers_7_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_7_norm_conv_weight_to_fp16, x = input_411_cast_fp16)[name = tensor("x_199_cast_fp16")]; tensor input_413_perm_0 = const()[name = tensor("input_413_perm_0"), val = tensor([0, 2, 1])]; tensor input_415_pad_type_0 = const()[name = tensor("input_415_pad_type_0"), val = tensor("valid")]; tensor input_415_strides_0 = const()[name = tensor("input_415_strides_0"), val = tensor([1])]; tensor input_415_pad_0 = const()[name = tensor("input_415_pad_0"), val = tensor([0, 0])]; tensor input_415_dilations_0 = const()[name = tensor("input_415_dilations_0"), val = tensor([1])]; tensor input_415_groups_0 = const()[name = tensor("input_415_groups_0"), val = tensor(1)]; tensor encoder_layers_7_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_7_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160997504))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163094720))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_413_cast_fp16 = transpose(perm = input_413_perm_0, x = x_199_cast_fp16)[name = tensor("transpose_294")]; tensor input_415_cast_fp16 = conv(dilations = input_415_dilations_0, groups = input_415_groups_0, pad = input_415_pad_0, pad_type = input_415_pad_type_0, strides = input_415_strides_0, weight = encoder_layers_7_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_413_cast_fp16)[name = tensor("input_415_cast_fp16")]; tensor x_201_split_num_splits_0 = const()[name = tensor("x_201_split_num_splits_0"), val = tensor(2)]; tensor x_201_split_axis_0 = const()[name = tensor("x_201_split_axis_0"), val = tensor(1)]; tensor x_201_split_cast_fp16_0, tensor x_201_split_cast_fp16_1 = split(axis = x_201_split_axis_0, num_splits = x_201_split_num_splits_0, x = input_415_cast_fp16)[name = tensor("x_201_split_cast_fp16")]; tensor x_201_split_1_sigmoid_cast_fp16 = sigmoid(x = x_201_split_cast_fp16_1)[name = tensor("x_201_split_1_sigmoid_cast_fp16")]; tensor x_201_cast_fp16 = mul(x = x_201_split_cast_fp16_0, y = x_201_split_1_sigmoid_cast_fp16)[name = tensor("x_201_cast_fp16")]; tensor input_417_cast_fp16 = select(a = var_44_to_fp16, b = x_201_cast_fp16, cond = var_575)[name = tensor("input_417_cast_fp16")]; tensor new_x_31_interleave_0 = const()[name = tensor("new_x_31_interleave_0"), val = tensor(false)]; tensor new_x_31_cast_fp16 = concat(axis = var_59, interleave = new_x_31_interleave_0, values = (cache_31_cast_fp16, input_417_cast_fp16))[name = tensor("new_x_31_cast_fp16")]; tensor var_2079_begin_0 = const()[name = tensor("op_2079_begin_0"), val = tensor([0, 0, 7])]; tensor var_2079_end_0 = const()[name = tensor("op_2079_end_0"), val = tensor([1, 1024, 15])]; tensor var_2079_end_mask_0 = const()[name = tensor("op_2079_end_mask_0"), val = tensor([true, true, true])]; tensor var_2079_cast_fp16 = slice_by_index(begin = var_2079_begin_0, end = var_2079_end_0, end_mask = var_2079_end_mask_0, x = new_x_31_cast_fp16)[name = tensor("op_2079_cast_fp16")]; tensor x_203_pad_type_0 = const()[name = tensor("x_203_pad_type_0"), val = tensor("valid")]; tensor x_203_groups_0 = const()[name = tensor("x_203_groups_0"), val = tensor(1024)]; tensor x_203_strides_0 = const()[name = tensor("x_203_strides_0"), val = tensor([1])]; tensor x_203_pad_0 = const()[name = tensor("x_203_pad_0"), val = tensor([0, 0])]; tensor x_203_dilations_0 = const()[name = tensor("x_203_dilations_0"), val = tensor([1])]; tensor encoder_layers_7_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_7_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163098880))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163108160))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_203_cast_fp16 = conv(dilations = x_203_dilations_0, groups = x_203_groups_0, pad = x_203_pad_0, pad_type = x_203_pad_type_0, strides = x_203_strides_0, weight = encoder_layers_7_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_31_cast_fp16)[name = tensor("x_203_cast_fp16")]; tensor input_419_perm_0 = const()[name = tensor("input_419_perm_0"), val = tensor([0, 2, 1])]; tensor x_205_axes_0 = const()[name = tensor("x_205_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_7_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163110272)))]; tensor encoder_layers_7_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_7_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163112384)))]; tensor input_419_cast_fp16 = transpose(perm = input_419_perm_0, x = x_203_cast_fp16)[name = tensor("transpose_293")]; tensor x_205_cast_fp16 = layer_norm(axes = x_205_axes_0, beta = encoder_layers_7_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_7_conv_batch_norm_weight_to_fp16, x = input_419_cast_fp16)[name = tensor("x_205_cast_fp16")]; tensor input_421_perm_0 = const()[name = tensor("input_421_perm_0"), val = tensor([0, 2, 1])]; tensor input_421_cast_fp16 = transpose(perm = input_421_perm_0, x = x_205_cast_fp16)[name = tensor("transpose_292")]; tensor input_423_cast_fp16 = silu(x = input_421_cast_fp16)[name = tensor("input_423_cast_fp16")]; tensor x_207_pad_type_0 = const()[name = tensor("x_207_pad_type_0"), val = tensor("valid")]; tensor x_207_strides_0 = const()[name = tensor("x_207_strides_0"), val = tensor([1])]; tensor x_207_pad_0 = const()[name = tensor("x_207_pad_0"), val = tensor([0, 0])]; tensor x_207_dilations_0 = const()[name = tensor("x_207_dilations_0"), val = tensor([1])]; tensor x_207_groups_0 = const()[name = tensor("x_207_groups_0"), val = tensor(1)]; tensor encoder_layers_7_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_7_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163114496))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164163136))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_207_cast_fp16 = conv(dilations = x_207_dilations_0, groups = x_207_groups_0, pad = x_207_pad_0, pad_type = x_207_pad_type_0, strides = x_207_strides_0, weight = encoder_layers_7_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_423_cast_fp16)[name = tensor("x_207_cast_fp16")]; tensor input_425_perm_0 = const()[name = tensor("input_425_perm_0"), val = tensor([0, 2, 1])]; tensor input_425_cast_fp16 = transpose(perm = input_425_perm_0, x = x_207_cast_fp16)[name = tensor("transpose_291")]; tensor input_427_cast_fp16 = add(x = input_411_cast_fp16, y = input_425_cast_fp16)[name = tensor("input_427_cast_fp16")]; tensor input_429_axes_0 = const()[name = tensor("input_429_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_7_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164165248)))]; tensor encoder_layers_7_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_7_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164167360)))]; tensor input_429_cast_fp16 = layer_norm(axes = input_429_axes_0, beta = encoder_layers_7_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_7_norm_feed_forward2_weight_to_fp16, x = input_427_cast_fp16)[name = tensor("input_429_cast_fp16")]; tensor encoder_layers_7_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164169472))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167315264))), name = tensor("encoder_layers_7_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_7_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_7_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167315456)))]; tensor linear_71_cast_fp16 = linear(bias = encoder_layers_7_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_7_feed_forward2_linear1_weight_to_fp16_palettized, x = input_429_cast_fp16)[name = tensor("linear_71_cast_fp16")]; tensor input_433_cast_fp16 = silu(x = linear_71_cast_fp16)[name = tensor("input_433_cast_fp16")]; tensor encoder_layers_7_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167323712))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170469504))), name = tensor("encoder_layers_7_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_7_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_7_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170469696)))]; tensor linear_72_cast_fp16 = linear(bias = encoder_layers_7_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_7_feed_forward2_linear2_weight_to_fp16_palettized, x = input_433_cast_fp16)[name = tensor("linear_72_cast_fp16")]; tensor var_2122_to_fp16 = const()[name = tensor("op_2122_to_fp16"), val = tensor(0x1p-1)]; tensor var_2123_cast_fp16 = mul(x = linear_72_cast_fp16, y = var_2122_to_fp16)[name = tensor("op_2123_cast_fp16")]; tensor input_439_cast_fp16 = add(x = input_427_cast_fp16, y = var_2123_cast_fp16)[name = tensor("input_439_cast_fp16")]; tensor input_441_axes_0 = const()[name = tensor("input_441_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_7_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170471808)))]; tensor encoder_layers_7_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_7_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170473920)))]; tensor input_441_cast_fp16 = layer_norm(axes = input_441_axes_0, beta = encoder_layers_7_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_7_norm_out_weight_to_fp16, x = input_439_cast_fp16)[name = tensor("input_441_cast_fp16")]; tensor cache_33_begin_0 = const()[name = tensor("cache_33_begin_0"), val = tensor([8, 0, 0, 0])]; tensor cache_33_end_0 = const()[name = tensor("cache_33_end_0"), val = tensor([9, 1, 42, 1024])]; tensor cache_33_end_mask_0 = const()[name = tensor("cache_33_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_33_squeeze_mask_0 = const()[name = tensor("cache_33_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_33_cast_fp16 = slice_by_index(begin = cache_33_begin_0, end = cache_33_end_0, end_mask = cache_33_end_mask_0, squeeze_mask = cache_33_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_33_cast_fp16")]; tensor cache_35_begin_0 = const()[name = tensor("cache_35_begin_0"), val = tensor([8, 0, 0, 0])]; tensor cache_35_end_0 = const()[name = tensor("cache_35_end_0"), val = tensor([9, 1, 1024, 8])]; tensor cache_35_end_mask_0 = const()[name = tensor("cache_35_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_35_squeeze_mask_0 = const()[name = tensor("cache_35_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_35_cast_fp16 = slice_by_index(begin = cache_35_begin_0, end = cache_35_end_0, end_mask = cache_35_end_mask_0, squeeze_mask = cache_35_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_35_cast_fp16")]; tensor input_443_axes_0 = const()[name = tensor("input_443_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_8_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170476032)))]; tensor encoder_layers_8_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_8_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170478144)))]; tensor input_443_cast_fp16 = layer_norm(axes = input_443_axes_0, beta = encoder_layers_8_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_8_norm_feed_forward1_weight_to_fp16, x = input_441_cast_fp16)[name = tensor("input_443_cast_fp16")]; tensor encoder_layers_8_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170480256))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(173626048))), name = tensor("encoder_layers_8_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_8_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_8_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(173626240)))]; tensor linear_73_cast_fp16 = linear(bias = encoder_layers_8_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_8_feed_forward1_linear1_weight_to_fp16_palettized, x = input_443_cast_fp16)[name = tensor("linear_73_cast_fp16")]; tensor input_447_cast_fp16 = silu(x = linear_73_cast_fp16)[name = tensor("input_447_cast_fp16")]; tensor encoder_layers_8_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(173634496))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(176780288))), name = tensor("encoder_layers_8_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_8_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_8_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(176780480)))]; tensor linear_74_cast_fp16 = linear(bias = encoder_layers_8_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_8_feed_forward1_linear2_weight_to_fp16_palettized, x = input_447_cast_fp16)[name = tensor("linear_74_cast_fp16")]; tensor var_2159_to_fp16 = const()[name = tensor("op_2159_to_fp16"), val = tensor(0x1p-1)]; tensor var_2160_cast_fp16 = mul(x = linear_74_cast_fp16, y = var_2159_to_fp16)[name = tensor("op_2160_cast_fp16")]; tensor input_453_cast_fp16 = add(x = input_441_cast_fp16, y = var_2160_cast_fp16)[name = tensor("input_453_cast_fp16")]; tensor key_17_axes_0 = const()[name = tensor("key_17_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_8_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(176782592)))]; tensor encoder_layers_8_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_8_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(176784704)))]; tensor key_17_cast_fp16 = layer_norm(axes = key_17_axes_0, beta = encoder_layers_8_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_8_norm_self_att_weight_to_fp16, x = input_453_cast_fp16)[name = tensor("key_17_cast_fp16")]; tensor input_455_interleave_0 = const()[name = tensor("input_455_interleave_0"), val = tensor(false)]; tensor input_455_cast_fp16 = concat(axis = var_68, interleave = input_455_interleave_0, values = (cache_33_cast_fp16, key_17_cast_fp16))[name = tensor("input_455_cast_fp16")]; tensor var_2182_begin_0 = const()[name = tensor("op_2182_begin_0"), val = tensor([0, 7, 0])]; tensor var_2182_end_0 = const()[name = tensor("op_2182_end_0"), val = tensor([1, 42, 1024])]; tensor var_2182_end_mask_0 = const()[name = tensor("op_2182_end_mask_0"), val = tensor([true, true, true])]; tensor var_2182_cast_fp16 = slice_by_index(begin = var_2182_begin_0, end = var_2182_end_0, end_mask = var_2182_end_mask_0, x = cache_33_cast_fp16)[name = tensor("op_2182_cast_fp16")]; tensor var_2188_interleave_0 = const()[name = tensor("op_2188_interleave_0"), val = tensor(false)]; tensor var_2188_cast_fp16 = concat(axis = var_68, interleave = var_2188_interleave_0, values = (var_2182_cast_fp16, key_17_cast_fp16))[name = tensor("op_2188_cast_fp16")]; tensor encoder_layers_8_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(176786816))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177573312))), name = tensor("encoder_layers_8_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_8_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177573504)))]; tensor linear_75_cast_fp16 = linear(bias = encoder_layers_8_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_8_self_attn_linear_q_weight_to_fp16_palettized, x = key_17_cast_fp16)[name = tensor("linear_75_cast_fp16")]; tensor var_2193 = const()[name = tensor("op_2193"), val = tensor([1, -1, 8, 128])]; tensor q_49_cast_fp16 = reshape(shape = var_2193, x = linear_75_cast_fp16)[name = tensor("q_49_cast_fp16")]; tensor encoder_layers_8_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177575616))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178362112))), name = tensor("encoder_layers_8_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_8_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178362304)))]; tensor linear_76_cast_fp16 = linear(bias = encoder_layers_8_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_8_self_attn_linear_k_weight_to_fp16_palettized, x = input_455_cast_fp16)[name = tensor("linear_76_cast_fp16")]; tensor var_2198 = const()[name = tensor("op_2198"), val = tensor([1, -1, 8, 128])]; tensor k_33_cast_fp16 = reshape(shape = var_2198, x = linear_76_cast_fp16)[name = tensor("k_33_cast_fp16")]; tensor encoder_layers_8_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178364416))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179150912))), name = tensor("encoder_layers_8_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_8_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179151104)))]; tensor linear_77_cast_fp16 = linear(bias = encoder_layers_8_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_8_self_attn_linear_v_weight_to_fp16_palettized, x = input_455_cast_fp16)[name = tensor("linear_77_cast_fp16")]; tensor var_2203 = const()[name = tensor("op_2203"), val = tensor([1, -1, 8, 128])]; tensor v_17_cast_fp16 = reshape(shape = var_2203, x = linear_77_cast_fp16)[name = tensor("v_17_cast_fp16")]; tensor value_25_perm_0 = const()[name = tensor("value_25_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_8_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179153216)))]; tensor var_2216_cast_fp16 = add(x = q_49_cast_fp16, y = encoder_layers_8_self_attn_pos_bias_u_to_fp16)[name = tensor("op_2216_cast_fp16")]; tensor encoder_layers_8_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179155328)))]; tensor var_2218_cast_fp16 = add(x = q_49_cast_fp16, y = encoder_layers_8_self_attn_pos_bias_v_to_fp16)[name = tensor("op_2218_cast_fp16")]; tensor q_with_bias_v_17_perm_0 = const()[name = tensor("q_with_bias_v_17_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_215_transpose_x_0 = const()[name = tensor("x_215_transpose_x_0"), val = tensor(false)]; tensor x_215_transpose_y_0 = const()[name = tensor("x_215_transpose_y_0"), val = tensor(false)]; tensor op_2220_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_2220_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179157440))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179257024))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179256832)))]; tensor q_with_bias_v_17_cast_fp16 = transpose(perm = q_with_bias_v_17_perm_0, x = var_2218_cast_fp16)[name = tensor("transpose_290")]; tensor x_215_cast_fp16 = matmul(transpose_x = x_215_transpose_x_0, transpose_y = x_215_transpose_y_0, x = q_with_bias_v_17_cast_fp16, y = op_2220_to_fp16_quantized)[name = tensor("x_215_cast_fp16")]; tensor x_217_pad_0 = const()[name = tensor("x_217_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_217_mode_0 = const()[name = tensor("x_217_mode_0"), val = tensor("constant")]; tensor const_183_to_fp16 = const()[name = tensor("const_183_to_fp16"), val = tensor(0x0p+0)]; tensor x_217_cast_fp16 = pad(constant_val = const_183_to_fp16, mode = x_217_mode_0, pad = x_217_pad_0, x = x_215_cast_fp16)[name = tensor("x_217_cast_fp16")]; tensor var_2228 = const()[name = tensor("op_2228"), val = tensor([1, 8, -1, 7])]; tensor x_219_cast_fp16 = reshape(shape = var_2228, x = x_217_cast_fp16)[name = tensor("x_219_cast_fp16")]; tensor var_2232_begin_0 = const()[name = tensor("op_2232_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_2232_end_0 = const()[name = tensor("op_2232_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_2232_end_mask_0 = const()[name = tensor("op_2232_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_2232_cast_fp16 = slice_by_index(begin = var_2232_begin_0, end = var_2232_end_0, end_mask = var_2232_end_mask_0, x = x_219_cast_fp16)[name = tensor("op_2232_cast_fp16")]; tensor var_2233 = const()[name = tensor("op_2233"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_33_cast_fp16 = reshape(shape = var_2233, x = var_2232_cast_fp16)[name = tensor("matrix_bd_33_cast_fp16")]; tensor matrix_ac_17_transpose_x_0 = const()[name = tensor("matrix_ac_17_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_17_transpose_y_0 = const()[name = tensor("matrix_ac_17_transpose_y_0"), val = tensor(false)]; tensor transpose_112_perm_0 = const()[name = tensor("transpose_112_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_113_perm_0 = const()[name = tensor("transpose_113_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_113 = transpose(perm = transpose_113_perm_0, x = k_33_cast_fp16)[name = tensor("transpose_288")]; tensor transpose_112 = transpose(perm = transpose_112_perm_0, x = var_2216_cast_fp16)[name = tensor("transpose_289")]; tensor matrix_ac_17_cast_fp16 = matmul(transpose_x = matrix_ac_17_transpose_x_0, transpose_y = matrix_ac_17_transpose_y_0, x = transpose_112, y = transpose_113)[name = tensor("matrix_ac_17_cast_fp16")]; tensor matrix_bd_35_begin_0 = const()[name = tensor("matrix_bd_35_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_35_end_0 = const()[name = tensor("matrix_bd_35_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_35_end_mask_0 = const()[name = tensor("matrix_bd_35_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_35_cast_fp16 = slice_by_index(begin = matrix_bd_35_begin_0, end = matrix_bd_35_end_0, end_mask = matrix_bd_35_end_mask_0, x = matrix_bd_33_cast_fp16)[name = tensor("matrix_bd_35_cast_fp16")]; tensor var_2242_cast_fp16 = add(x = matrix_ac_17_cast_fp16, y = matrix_bd_35_cast_fp16)[name = tensor("op_2242_cast_fp16")]; tensor _inversed_scores_33_y_0_to_fp16 = const()[name = tensor("_inversed_scores_33_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_33_cast_fp16 = mul(x = var_2242_cast_fp16, y = _inversed_scores_33_y_0_to_fp16)[name = tensor("_inversed_scores_33_cast_fp16")]; tensor scores_35_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_33_cast_fp16, cond = mask_11)[name = tensor("scores_35_cast_fp16")]; tensor var_2248_cast_fp16 = softmax(axis = var_59, x = scores_35_cast_fp16)[name = tensor("op_2248_cast_fp16")]; tensor input_457_cast_fp16 = select(a = var_44_to_fp16, b = var_2248_cast_fp16, cond = mask_11)[name = tensor("input_457_cast_fp16")]; tensor x_221_transpose_x_0 = const()[name = tensor("x_221_transpose_x_0"), val = tensor(false)]; tensor x_221_transpose_y_0 = const()[name = tensor("x_221_transpose_y_0"), val = tensor(false)]; tensor value_25_cast_fp16 = transpose(perm = value_25_perm_0, x = v_17_cast_fp16)[name = tensor("transpose_287")]; tensor x_221_cast_fp16 = matmul(transpose_x = x_221_transpose_x_0, transpose_y = x_221_transpose_y_0, x = input_457_cast_fp16, y = value_25_cast_fp16)[name = tensor("x_221_cast_fp16")]; tensor var_2252_perm_0 = const()[name = tensor("op_2252_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2253 = const()[name = tensor("op_2253"), val = tensor([1, -1, 1024])]; tensor var_2252_cast_fp16 = transpose(perm = var_2252_perm_0, x = x_221_cast_fp16)[name = tensor("transpose_286")]; tensor input_459_cast_fp16 = reshape(shape = var_2253, x = var_2252_cast_fp16)[name = tensor("input_459_cast_fp16")]; tensor encoder_layers_8_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179257344))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180043840))), name = tensor("encoder_layers_8_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_8_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180044032)))]; tensor linear_79_cast_fp16 = linear(bias = encoder_layers_8_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_8_self_attn_linear_out_weight_to_fp16_palettized, x = input_459_cast_fp16)[name = tensor("linear_79_cast_fp16")]; tensor input_463_cast_fp16 = add(x = input_453_cast_fp16, y = linear_79_cast_fp16)[name = tensor("input_463_cast_fp16")]; tensor x_225_axes_0 = const()[name = tensor("x_225_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_8_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180046144)))]; tensor encoder_layers_8_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_8_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180048256)))]; tensor x_225_cast_fp16 = layer_norm(axes = x_225_axes_0, beta = encoder_layers_8_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_8_norm_conv_weight_to_fp16, x = input_463_cast_fp16)[name = tensor("x_225_cast_fp16")]; tensor input_465_perm_0 = const()[name = tensor("input_465_perm_0"), val = tensor([0, 2, 1])]; tensor input_467_pad_type_0 = const()[name = tensor("input_467_pad_type_0"), val = tensor("valid")]; tensor input_467_strides_0 = const()[name = tensor("input_467_strides_0"), val = tensor([1])]; tensor input_467_pad_0 = const()[name = tensor("input_467_pad_0"), val = tensor([0, 0])]; tensor input_467_dilations_0 = const()[name = tensor("input_467_dilations_0"), val = tensor([1])]; tensor input_467_groups_0 = const()[name = tensor("input_467_groups_0"), val = tensor(1)]; tensor encoder_layers_8_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_8_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180050368))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182147584))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_465_cast_fp16 = transpose(perm = input_465_perm_0, x = x_225_cast_fp16)[name = tensor("transpose_285")]; tensor input_467_cast_fp16 = conv(dilations = input_467_dilations_0, groups = input_467_groups_0, pad = input_467_pad_0, pad_type = input_467_pad_type_0, strides = input_467_strides_0, weight = encoder_layers_8_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_465_cast_fp16)[name = tensor("input_467_cast_fp16")]; tensor x_227_split_num_splits_0 = const()[name = tensor("x_227_split_num_splits_0"), val = tensor(2)]; tensor x_227_split_axis_0 = const()[name = tensor("x_227_split_axis_0"), val = tensor(1)]; tensor x_227_split_cast_fp16_0, tensor x_227_split_cast_fp16_1 = split(axis = x_227_split_axis_0, num_splits = x_227_split_num_splits_0, x = input_467_cast_fp16)[name = tensor("x_227_split_cast_fp16")]; tensor x_227_split_1_sigmoid_cast_fp16 = sigmoid(x = x_227_split_cast_fp16_1)[name = tensor("x_227_split_1_sigmoid_cast_fp16")]; tensor x_227_cast_fp16 = mul(x = x_227_split_cast_fp16_0, y = x_227_split_1_sigmoid_cast_fp16)[name = tensor("x_227_cast_fp16")]; tensor input_469_cast_fp16 = select(a = var_44_to_fp16, b = x_227_cast_fp16, cond = var_575)[name = tensor("input_469_cast_fp16")]; tensor new_x_35_interleave_0 = const()[name = tensor("new_x_35_interleave_0"), val = tensor(false)]; tensor new_x_35_cast_fp16 = concat(axis = var_59, interleave = new_x_35_interleave_0, values = (cache_35_cast_fp16, input_469_cast_fp16))[name = tensor("new_x_35_cast_fp16")]; tensor var_2292_begin_0 = const()[name = tensor("op_2292_begin_0"), val = tensor([0, 0, 7])]; tensor var_2292_end_0 = const()[name = tensor("op_2292_end_0"), val = tensor([1, 1024, 15])]; tensor var_2292_end_mask_0 = const()[name = tensor("op_2292_end_mask_0"), val = tensor([true, true, true])]; tensor var_2292_cast_fp16 = slice_by_index(begin = var_2292_begin_0, end = var_2292_end_0, end_mask = var_2292_end_mask_0, x = new_x_35_cast_fp16)[name = tensor("op_2292_cast_fp16")]; tensor x_229_pad_type_0 = const()[name = tensor("x_229_pad_type_0"), val = tensor("valid")]; tensor x_229_groups_0 = const()[name = tensor("x_229_groups_0"), val = tensor(1024)]; tensor x_229_strides_0 = const()[name = tensor("x_229_strides_0"), val = tensor([1])]; tensor x_229_pad_0 = const()[name = tensor("x_229_pad_0"), val = tensor([0, 0])]; tensor x_229_dilations_0 = const()[name = tensor("x_229_dilations_0"), val = tensor([1])]; tensor encoder_layers_8_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_8_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182151744))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182161024))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_229_cast_fp16 = conv(dilations = x_229_dilations_0, groups = x_229_groups_0, pad = x_229_pad_0, pad_type = x_229_pad_type_0, strides = x_229_strides_0, weight = encoder_layers_8_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_35_cast_fp16)[name = tensor("x_229_cast_fp16")]; tensor input_471_perm_0 = const()[name = tensor("input_471_perm_0"), val = tensor([0, 2, 1])]; tensor x_231_axes_0 = const()[name = tensor("x_231_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_8_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182163136)))]; tensor encoder_layers_8_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_8_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182165248)))]; tensor input_471_cast_fp16 = transpose(perm = input_471_perm_0, x = x_229_cast_fp16)[name = tensor("transpose_284")]; tensor x_231_cast_fp16 = layer_norm(axes = x_231_axes_0, beta = encoder_layers_8_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_8_conv_batch_norm_weight_to_fp16, x = input_471_cast_fp16)[name = tensor("x_231_cast_fp16")]; tensor input_473_perm_0 = const()[name = tensor("input_473_perm_0"), val = tensor([0, 2, 1])]; tensor input_473_cast_fp16 = transpose(perm = input_473_perm_0, x = x_231_cast_fp16)[name = tensor("transpose_283")]; tensor input_475_cast_fp16 = silu(x = input_473_cast_fp16)[name = tensor("input_475_cast_fp16")]; tensor x_233_pad_type_0 = const()[name = tensor("x_233_pad_type_0"), val = tensor("valid")]; tensor x_233_strides_0 = const()[name = tensor("x_233_strides_0"), val = tensor([1])]; tensor x_233_pad_0 = const()[name = tensor("x_233_pad_0"), val = tensor([0, 0])]; tensor x_233_dilations_0 = const()[name = tensor("x_233_dilations_0"), val = tensor([1])]; tensor x_233_groups_0 = const()[name = tensor("x_233_groups_0"), val = tensor(1)]; tensor encoder_layers_8_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_8_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182167360))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183216000))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_233_cast_fp16 = conv(dilations = x_233_dilations_0, groups = x_233_groups_0, pad = x_233_pad_0, pad_type = x_233_pad_type_0, strides = x_233_strides_0, weight = encoder_layers_8_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_475_cast_fp16)[name = tensor("x_233_cast_fp16")]; tensor input_477_perm_0 = const()[name = tensor("input_477_perm_0"), val = tensor([0, 2, 1])]; tensor input_477_cast_fp16 = transpose(perm = input_477_perm_0, x = x_233_cast_fp16)[name = tensor("transpose_282")]; tensor input_479_cast_fp16 = add(x = input_463_cast_fp16, y = input_477_cast_fp16)[name = tensor("input_479_cast_fp16")]; tensor input_481_axes_0 = const()[name = tensor("input_481_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_8_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183218112)))]; tensor encoder_layers_8_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_8_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183220224)))]; tensor input_481_cast_fp16 = layer_norm(axes = input_481_axes_0, beta = encoder_layers_8_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_8_norm_feed_forward2_weight_to_fp16, x = input_479_cast_fp16)[name = tensor("input_481_cast_fp16")]; tensor encoder_layers_8_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183222336))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186368128))), name = tensor("encoder_layers_8_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_8_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_8_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186368320)))]; tensor linear_80_cast_fp16 = linear(bias = encoder_layers_8_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_8_feed_forward2_linear1_weight_to_fp16_palettized, x = input_481_cast_fp16)[name = tensor("linear_80_cast_fp16")]; tensor input_485_cast_fp16 = silu(x = linear_80_cast_fp16)[name = tensor("input_485_cast_fp16")]; tensor encoder_layers_8_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186376576))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(189522368))), name = tensor("encoder_layers_8_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_8_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_8_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(189522560)))]; tensor linear_81_cast_fp16 = linear(bias = encoder_layers_8_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_8_feed_forward2_linear2_weight_to_fp16_palettized, x = input_485_cast_fp16)[name = tensor("linear_81_cast_fp16")]; tensor var_2335_to_fp16 = const()[name = tensor("op_2335_to_fp16"), val = tensor(0x1p-1)]; tensor var_2336_cast_fp16 = mul(x = linear_81_cast_fp16, y = var_2335_to_fp16)[name = tensor("op_2336_cast_fp16")]; tensor input_491_cast_fp16 = add(x = input_479_cast_fp16, y = var_2336_cast_fp16)[name = tensor("input_491_cast_fp16")]; tensor input_493_axes_0 = const()[name = tensor("input_493_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_8_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(189524672)))]; tensor encoder_layers_8_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_8_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(189526784)))]; tensor input_493_cast_fp16 = layer_norm(axes = input_493_axes_0, beta = encoder_layers_8_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_8_norm_out_weight_to_fp16, x = input_491_cast_fp16)[name = tensor("input_493_cast_fp16")]; tensor cache_37_begin_0 = const()[name = tensor("cache_37_begin_0"), val = tensor([9, 0, 0, 0])]; tensor cache_37_end_0 = const()[name = tensor("cache_37_end_0"), val = tensor([10, 1, 42, 1024])]; tensor cache_37_end_mask_0 = const()[name = tensor("cache_37_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_37_squeeze_mask_0 = const()[name = tensor("cache_37_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_37_cast_fp16 = slice_by_index(begin = cache_37_begin_0, end = cache_37_end_0, end_mask = cache_37_end_mask_0, squeeze_mask = cache_37_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_37_cast_fp16")]; tensor cache_39_begin_0 = const()[name = tensor("cache_39_begin_0"), val = tensor([9, 0, 0, 0])]; tensor cache_39_end_0 = const()[name = tensor("cache_39_end_0"), val = tensor([10, 1, 1024, 8])]; tensor cache_39_end_mask_0 = const()[name = tensor("cache_39_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_39_squeeze_mask_0 = const()[name = tensor("cache_39_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_39_cast_fp16 = slice_by_index(begin = cache_39_begin_0, end = cache_39_end_0, end_mask = cache_39_end_mask_0, squeeze_mask = cache_39_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_39_cast_fp16")]; tensor input_495_axes_0 = const()[name = tensor("input_495_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_9_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(189528896)))]; tensor encoder_layers_9_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_9_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(189531008)))]; tensor input_495_cast_fp16 = layer_norm(axes = input_495_axes_0, beta = encoder_layers_9_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_9_norm_feed_forward1_weight_to_fp16, x = input_493_cast_fp16)[name = tensor("input_495_cast_fp16")]; tensor encoder_layers_9_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(189533120))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192678912))), name = tensor("encoder_layers_9_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_9_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_9_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192679104)))]; tensor linear_82_cast_fp16 = linear(bias = encoder_layers_9_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_9_feed_forward1_linear1_weight_to_fp16_palettized, x = input_495_cast_fp16)[name = tensor("linear_82_cast_fp16")]; tensor input_499_cast_fp16 = silu(x = linear_82_cast_fp16)[name = tensor("input_499_cast_fp16")]; tensor encoder_layers_9_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192687360))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195833152))), name = tensor("encoder_layers_9_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_9_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_9_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195833344)))]; tensor linear_83_cast_fp16 = linear(bias = encoder_layers_9_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_9_feed_forward1_linear2_weight_to_fp16_palettized, x = input_499_cast_fp16)[name = tensor("linear_83_cast_fp16")]; tensor var_2372_to_fp16 = const()[name = tensor("op_2372_to_fp16"), val = tensor(0x1p-1)]; tensor var_2373_cast_fp16 = mul(x = linear_83_cast_fp16, y = var_2372_to_fp16)[name = tensor("op_2373_cast_fp16")]; tensor input_505_cast_fp16 = add(x = input_493_cast_fp16, y = var_2373_cast_fp16)[name = tensor("input_505_cast_fp16")]; tensor key_19_axes_0 = const()[name = tensor("key_19_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_9_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195835456)))]; tensor encoder_layers_9_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_9_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195837568)))]; tensor key_19_cast_fp16 = layer_norm(axes = key_19_axes_0, beta = encoder_layers_9_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_9_norm_self_att_weight_to_fp16, x = input_505_cast_fp16)[name = tensor("key_19_cast_fp16")]; tensor input_507_interleave_0 = const()[name = tensor("input_507_interleave_0"), val = tensor(false)]; tensor input_507_cast_fp16 = concat(axis = var_68, interleave = input_507_interleave_0, values = (cache_37_cast_fp16, key_19_cast_fp16))[name = tensor("input_507_cast_fp16")]; tensor var_2395_begin_0 = const()[name = tensor("op_2395_begin_0"), val = tensor([0, 7, 0])]; tensor var_2395_end_0 = const()[name = tensor("op_2395_end_0"), val = tensor([1, 42, 1024])]; tensor var_2395_end_mask_0 = const()[name = tensor("op_2395_end_mask_0"), val = tensor([true, true, true])]; tensor var_2395_cast_fp16 = slice_by_index(begin = var_2395_begin_0, end = var_2395_end_0, end_mask = var_2395_end_mask_0, x = cache_37_cast_fp16)[name = tensor("op_2395_cast_fp16")]; tensor var_2401_interleave_0 = const()[name = tensor("op_2401_interleave_0"), val = tensor(false)]; tensor var_2401_cast_fp16 = concat(axis = var_68, interleave = var_2401_interleave_0, values = (var_2395_cast_fp16, key_19_cast_fp16))[name = tensor("op_2401_cast_fp16")]; tensor encoder_layers_9_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195839680))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196626176))), name = tensor("encoder_layers_9_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_9_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196626368)))]; tensor linear_84_cast_fp16 = linear(bias = encoder_layers_9_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_9_self_attn_linear_q_weight_to_fp16_palettized, x = key_19_cast_fp16)[name = tensor("linear_84_cast_fp16")]; tensor var_2406 = const()[name = tensor("op_2406"), val = tensor([1, -1, 8, 128])]; tensor q_55_cast_fp16 = reshape(shape = var_2406, x = linear_84_cast_fp16)[name = tensor("q_55_cast_fp16")]; tensor encoder_layers_9_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196628480))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(197414976))), name = tensor("encoder_layers_9_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_9_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(197415168)))]; tensor linear_85_cast_fp16 = linear(bias = encoder_layers_9_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_9_self_attn_linear_k_weight_to_fp16_palettized, x = input_507_cast_fp16)[name = tensor("linear_85_cast_fp16")]; tensor var_2411 = const()[name = tensor("op_2411"), val = tensor([1, -1, 8, 128])]; tensor k_37_cast_fp16 = reshape(shape = var_2411, x = linear_85_cast_fp16)[name = tensor("k_37_cast_fp16")]; tensor encoder_layers_9_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(197417280))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198203776))), name = tensor("encoder_layers_9_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_9_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198203968)))]; tensor linear_86_cast_fp16 = linear(bias = encoder_layers_9_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_9_self_attn_linear_v_weight_to_fp16_palettized, x = input_507_cast_fp16)[name = tensor("linear_86_cast_fp16")]; tensor var_2416 = const()[name = tensor("op_2416"), val = tensor([1, -1, 8, 128])]; tensor v_19_cast_fp16 = reshape(shape = var_2416, x = linear_86_cast_fp16)[name = tensor("v_19_cast_fp16")]; tensor value_27_perm_0 = const()[name = tensor("value_27_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_9_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198206080)))]; tensor var_2429_cast_fp16 = add(x = q_55_cast_fp16, y = encoder_layers_9_self_attn_pos_bias_u_to_fp16)[name = tensor("op_2429_cast_fp16")]; tensor encoder_layers_9_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198208192)))]; tensor var_2431_cast_fp16 = add(x = q_55_cast_fp16, y = encoder_layers_9_self_attn_pos_bias_v_to_fp16)[name = tensor("op_2431_cast_fp16")]; tensor q_with_bias_v_19_perm_0 = const()[name = tensor("q_with_bias_v_19_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_241_transpose_x_0 = const()[name = tensor("x_241_transpose_x_0"), val = tensor(false)]; tensor x_241_transpose_y_0 = const()[name = tensor("x_241_transpose_y_0"), val = tensor(false)]; tensor op_2433_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_2433_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198210304))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198309888))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198309696)))]; tensor q_with_bias_v_19_cast_fp16 = transpose(perm = q_with_bias_v_19_perm_0, x = var_2431_cast_fp16)[name = tensor("transpose_281")]; tensor x_241_cast_fp16 = matmul(transpose_x = x_241_transpose_x_0, transpose_y = x_241_transpose_y_0, x = q_with_bias_v_19_cast_fp16, y = op_2433_to_fp16_quantized)[name = tensor("x_241_cast_fp16")]; tensor x_243_pad_0 = const()[name = tensor("x_243_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_243_mode_0 = const()[name = tensor("x_243_mode_0"), val = tensor("constant")]; tensor const_196_to_fp16 = const()[name = tensor("const_196_to_fp16"), val = tensor(0x0p+0)]; tensor x_243_cast_fp16 = pad(constant_val = const_196_to_fp16, mode = x_243_mode_0, pad = x_243_pad_0, x = x_241_cast_fp16)[name = tensor("x_243_cast_fp16")]; tensor var_2441 = const()[name = tensor("op_2441"), val = tensor([1, 8, -1, 7])]; tensor x_245_cast_fp16 = reshape(shape = var_2441, x = x_243_cast_fp16)[name = tensor("x_245_cast_fp16")]; tensor var_2445_begin_0 = const()[name = tensor("op_2445_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_2445_end_0 = const()[name = tensor("op_2445_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_2445_end_mask_0 = const()[name = tensor("op_2445_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_2445_cast_fp16 = slice_by_index(begin = var_2445_begin_0, end = var_2445_end_0, end_mask = var_2445_end_mask_0, x = x_245_cast_fp16)[name = tensor("op_2445_cast_fp16")]; tensor var_2446 = const()[name = tensor("op_2446"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_37_cast_fp16 = reshape(shape = var_2446, x = var_2445_cast_fp16)[name = tensor("matrix_bd_37_cast_fp16")]; tensor matrix_ac_19_transpose_x_0 = const()[name = tensor("matrix_ac_19_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_19_transpose_y_0 = const()[name = tensor("matrix_ac_19_transpose_y_0"), val = tensor(false)]; tensor transpose_114_perm_0 = const()[name = tensor("transpose_114_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_115_perm_0 = const()[name = tensor("transpose_115_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_115 = transpose(perm = transpose_115_perm_0, x = k_37_cast_fp16)[name = tensor("transpose_279")]; tensor transpose_114 = transpose(perm = transpose_114_perm_0, x = var_2429_cast_fp16)[name = tensor("transpose_280")]; tensor matrix_ac_19_cast_fp16 = matmul(transpose_x = matrix_ac_19_transpose_x_0, transpose_y = matrix_ac_19_transpose_y_0, x = transpose_114, y = transpose_115)[name = tensor("matrix_ac_19_cast_fp16")]; tensor matrix_bd_39_begin_0 = const()[name = tensor("matrix_bd_39_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_39_end_0 = const()[name = tensor("matrix_bd_39_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_39_end_mask_0 = const()[name = tensor("matrix_bd_39_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_39_cast_fp16 = slice_by_index(begin = matrix_bd_39_begin_0, end = matrix_bd_39_end_0, end_mask = matrix_bd_39_end_mask_0, x = matrix_bd_37_cast_fp16)[name = tensor("matrix_bd_39_cast_fp16")]; tensor var_2455_cast_fp16 = add(x = matrix_ac_19_cast_fp16, y = matrix_bd_39_cast_fp16)[name = tensor("op_2455_cast_fp16")]; tensor _inversed_scores_37_y_0_to_fp16 = const()[name = tensor("_inversed_scores_37_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_37_cast_fp16 = mul(x = var_2455_cast_fp16, y = _inversed_scores_37_y_0_to_fp16)[name = tensor("_inversed_scores_37_cast_fp16")]; tensor scores_39_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_37_cast_fp16, cond = mask_11)[name = tensor("scores_39_cast_fp16")]; tensor var_2461_cast_fp16 = softmax(axis = var_59, x = scores_39_cast_fp16)[name = tensor("op_2461_cast_fp16")]; tensor input_509_cast_fp16 = select(a = var_44_to_fp16, b = var_2461_cast_fp16, cond = mask_11)[name = tensor("input_509_cast_fp16")]; tensor x_247_transpose_x_0 = const()[name = tensor("x_247_transpose_x_0"), val = tensor(false)]; tensor x_247_transpose_y_0 = const()[name = tensor("x_247_transpose_y_0"), val = tensor(false)]; tensor value_27_cast_fp16 = transpose(perm = value_27_perm_0, x = v_19_cast_fp16)[name = tensor("transpose_278")]; tensor x_247_cast_fp16 = matmul(transpose_x = x_247_transpose_x_0, transpose_y = x_247_transpose_y_0, x = input_509_cast_fp16, y = value_27_cast_fp16)[name = tensor("x_247_cast_fp16")]; tensor var_2465_perm_0 = const()[name = tensor("op_2465_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2466 = const()[name = tensor("op_2466"), val = tensor([1, -1, 1024])]; tensor var_2465_cast_fp16 = transpose(perm = var_2465_perm_0, x = x_247_cast_fp16)[name = tensor("transpose_277")]; tensor input_511_cast_fp16 = reshape(shape = var_2466, x = var_2465_cast_fp16)[name = tensor("input_511_cast_fp16")]; tensor encoder_layers_9_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198310208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(199096704))), name = tensor("encoder_layers_9_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_9_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(199096896)))]; tensor linear_88_cast_fp16 = linear(bias = encoder_layers_9_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_9_self_attn_linear_out_weight_to_fp16_palettized, x = input_511_cast_fp16)[name = tensor("linear_88_cast_fp16")]; tensor input_515_cast_fp16 = add(x = input_505_cast_fp16, y = linear_88_cast_fp16)[name = tensor("input_515_cast_fp16")]; tensor x_251_axes_0 = const()[name = tensor("x_251_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_9_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(199099008)))]; tensor encoder_layers_9_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_9_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(199101120)))]; tensor x_251_cast_fp16 = layer_norm(axes = x_251_axes_0, beta = encoder_layers_9_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_9_norm_conv_weight_to_fp16, x = input_515_cast_fp16)[name = tensor("x_251_cast_fp16")]; tensor input_517_perm_0 = const()[name = tensor("input_517_perm_0"), val = tensor([0, 2, 1])]; tensor input_519_pad_type_0 = const()[name = tensor("input_519_pad_type_0"), val = tensor("valid")]; tensor input_519_strides_0 = const()[name = tensor("input_519_strides_0"), val = tensor([1])]; tensor input_519_pad_0 = const()[name = tensor("input_519_pad_0"), val = tensor([0, 0])]; tensor input_519_dilations_0 = const()[name = tensor("input_519_dilations_0"), val = tensor([1])]; tensor input_519_groups_0 = const()[name = tensor("input_519_groups_0"), val = tensor(1)]; tensor encoder_layers_9_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_9_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(199103232))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201200448))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_517_cast_fp16 = transpose(perm = input_517_perm_0, x = x_251_cast_fp16)[name = tensor("transpose_276")]; tensor input_519_cast_fp16 = conv(dilations = input_519_dilations_0, groups = input_519_groups_0, pad = input_519_pad_0, pad_type = input_519_pad_type_0, strides = input_519_strides_0, weight = encoder_layers_9_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_517_cast_fp16)[name = tensor("input_519_cast_fp16")]; tensor x_253_split_num_splits_0 = const()[name = tensor("x_253_split_num_splits_0"), val = tensor(2)]; tensor x_253_split_axis_0 = const()[name = tensor("x_253_split_axis_0"), val = tensor(1)]; tensor x_253_split_cast_fp16_0, tensor x_253_split_cast_fp16_1 = split(axis = x_253_split_axis_0, num_splits = x_253_split_num_splits_0, x = input_519_cast_fp16)[name = tensor("x_253_split_cast_fp16")]; tensor x_253_split_1_sigmoid_cast_fp16 = sigmoid(x = x_253_split_cast_fp16_1)[name = tensor("x_253_split_1_sigmoid_cast_fp16")]; tensor x_253_cast_fp16 = mul(x = x_253_split_cast_fp16_0, y = x_253_split_1_sigmoid_cast_fp16)[name = tensor("x_253_cast_fp16")]; tensor input_521_cast_fp16 = select(a = var_44_to_fp16, b = x_253_cast_fp16, cond = var_575)[name = tensor("input_521_cast_fp16")]; tensor new_x_39_interleave_0 = const()[name = tensor("new_x_39_interleave_0"), val = tensor(false)]; tensor new_x_39_cast_fp16 = concat(axis = var_59, interleave = new_x_39_interleave_0, values = (cache_39_cast_fp16, input_521_cast_fp16))[name = tensor("new_x_39_cast_fp16")]; tensor var_2505_begin_0 = const()[name = tensor("op_2505_begin_0"), val = tensor([0, 0, 7])]; tensor var_2505_end_0 = const()[name = tensor("op_2505_end_0"), val = tensor([1, 1024, 15])]; tensor var_2505_end_mask_0 = const()[name = tensor("op_2505_end_mask_0"), val = tensor([true, true, true])]; tensor var_2505_cast_fp16 = slice_by_index(begin = var_2505_begin_0, end = var_2505_end_0, end_mask = var_2505_end_mask_0, x = new_x_39_cast_fp16)[name = tensor("op_2505_cast_fp16")]; tensor x_255_pad_type_0 = const()[name = tensor("x_255_pad_type_0"), val = tensor("valid")]; tensor x_255_groups_0 = const()[name = tensor("x_255_groups_0"), val = tensor(1024)]; tensor x_255_strides_0 = const()[name = tensor("x_255_strides_0"), val = tensor([1])]; tensor x_255_pad_0 = const()[name = tensor("x_255_pad_0"), val = tensor([0, 0])]; tensor x_255_dilations_0 = const()[name = tensor("x_255_dilations_0"), val = tensor([1])]; tensor encoder_layers_9_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_9_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201204608))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201213888))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_255_cast_fp16 = conv(dilations = x_255_dilations_0, groups = x_255_groups_0, pad = x_255_pad_0, pad_type = x_255_pad_type_0, strides = x_255_strides_0, weight = encoder_layers_9_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_39_cast_fp16)[name = tensor("x_255_cast_fp16")]; tensor input_523_perm_0 = const()[name = tensor("input_523_perm_0"), val = tensor([0, 2, 1])]; tensor x_257_axes_0 = const()[name = tensor("x_257_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_9_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201216000)))]; tensor encoder_layers_9_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_9_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201218112)))]; tensor input_523_cast_fp16 = transpose(perm = input_523_perm_0, x = x_255_cast_fp16)[name = tensor("transpose_275")]; tensor x_257_cast_fp16 = layer_norm(axes = x_257_axes_0, beta = encoder_layers_9_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_9_conv_batch_norm_weight_to_fp16, x = input_523_cast_fp16)[name = tensor("x_257_cast_fp16")]; tensor input_525_perm_0 = const()[name = tensor("input_525_perm_0"), val = tensor([0, 2, 1])]; tensor input_525_cast_fp16 = transpose(perm = input_525_perm_0, x = x_257_cast_fp16)[name = tensor("transpose_274")]; tensor input_527_cast_fp16 = silu(x = input_525_cast_fp16)[name = tensor("input_527_cast_fp16")]; tensor x_259_pad_type_0 = const()[name = tensor("x_259_pad_type_0"), val = tensor("valid")]; tensor x_259_strides_0 = const()[name = tensor("x_259_strides_0"), val = tensor([1])]; tensor x_259_pad_0 = const()[name = tensor("x_259_pad_0"), val = tensor([0, 0])]; tensor x_259_dilations_0 = const()[name = tensor("x_259_dilations_0"), val = tensor([1])]; tensor x_259_groups_0 = const()[name = tensor("x_259_groups_0"), val = tensor(1)]; tensor encoder_layers_9_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_9_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201220224))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202268864))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_259_cast_fp16 = conv(dilations = x_259_dilations_0, groups = x_259_groups_0, pad = x_259_pad_0, pad_type = x_259_pad_type_0, strides = x_259_strides_0, weight = encoder_layers_9_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_527_cast_fp16)[name = tensor("x_259_cast_fp16")]; tensor input_529_perm_0 = const()[name = tensor("input_529_perm_0"), val = tensor([0, 2, 1])]; tensor input_529_cast_fp16 = transpose(perm = input_529_perm_0, x = x_259_cast_fp16)[name = tensor("transpose_273")]; tensor input_531_cast_fp16 = add(x = input_515_cast_fp16, y = input_529_cast_fp16)[name = tensor("input_531_cast_fp16")]; tensor input_533_axes_0 = const()[name = tensor("input_533_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_9_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202270976)))]; tensor encoder_layers_9_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_9_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202273088)))]; tensor input_533_cast_fp16 = layer_norm(axes = input_533_axes_0, beta = encoder_layers_9_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_9_norm_feed_forward2_weight_to_fp16, x = input_531_cast_fp16)[name = tensor("input_533_cast_fp16")]; tensor encoder_layers_9_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202275200))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(205420992))), name = tensor("encoder_layers_9_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_9_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_9_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(205421184)))]; tensor linear_89_cast_fp16 = linear(bias = encoder_layers_9_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_9_feed_forward2_linear1_weight_to_fp16_palettized, x = input_533_cast_fp16)[name = tensor("linear_89_cast_fp16")]; tensor input_537_cast_fp16 = silu(x = linear_89_cast_fp16)[name = tensor("input_537_cast_fp16")]; tensor encoder_layers_9_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(205429440))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(208575232))), name = tensor("encoder_layers_9_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_9_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_9_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(208575424)))]; tensor linear_90_cast_fp16 = linear(bias = encoder_layers_9_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_9_feed_forward2_linear2_weight_to_fp16_palettized, x = input_537_cast_fp16)[name = tensor("linear_90_cast_fp16")]; tensor var_2548_to_fp16 = const()[name = tensor("op_2548_to_fp16"), val = tensor(0x1p-1)]; tensor var_2549_cast_fp16 = mul(x = linear_90_cast_fp16, y = var_2548_to_fp16)[name = tensor("op_2549_cast_fp16")]; tensor input_543_cast_fp16 = add(x = input_531_cast_fp16, y = var_2549_cast_fp16)[name = tensor("input_543_cast_fp16")]; tensor input_545_axes_0 = const()[name = tensor("input_545_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_9_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(208577536)))]; tensor encoder_layers_9_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_9_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(208579648)))]; tensor input_545_cast_fp16 = layer_norm(axes = input_545_axes_0, beta = encoder_layers_9_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_9_norm_out_weight_to_fp16, x = input_543_cast_fp16)[name = tensor("input_545_cast_fp16")]; tensor cache_41_begin_0 = const()[name = tensor("cache_41_begin_0"), val = tensor([10, 0, 0, 0])]; tensor cache_41_end_0 = const()[name = tensor("cache_41_end_0"), val = tensor([11, 1, 42, 1024])]; tensor cache_41_end_mask_0 = const()[name = tensor("cache_41_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_41_squeeze_mask_0 = const()[name = tensor("cache_41_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_41_cast_fp16 = slice_by_index(begin = cache_41_begin_0, end = cache_41_end_0, end_mask = cache_41_end_mask_0, squeeze_mask = cache_41_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_41_cast_fp16")]; tensor cache_43_begin_0 = const()[name = tensor("cache_43_begin_0"), val = tensor([10, 0, 0, 0])]; tensor cache_43_end_0 = const()[name = tensor("cache_43_end_0"), val = tensor([11, 1, 1024, 8])]; tensor cache_43_end_mask_0 = const()[name = tensor("cache_43_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_43_squeeze_mask_0 = const()[name = tensor("cache_43_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_43_cast_fp16 = slice_by_index(begin = cache_43_begin_0, end = cache_43_end_0, end_mask = cache_43_end_mask_0, squeeze_mask = cache_43_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_43_cast_fp16")]; tensor input_547_axes_0 = const()[name = tensor("input_547_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_10_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(208581760)))]; tensor encoder_layers_10_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_10_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(208583872)))]; tensor input_547_cast_fp16 = layer_norm(axes = input_547_axes_0, beta = encoder_layers_10_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_10_norm_feed_forward1_weight_to_fp16, x = input_545_cast_fp16)[name = tensor("input_547_cast_fp16")]; tensor encoder_layers_10_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(208585984))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211731776))), name = tensor("encoder_layers_10_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_10_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_10_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211731968)))]; tensor linear_91_cast_fp16 = linear(bias = encoder_layers_10_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_10_feed_forward1_linear1_weight_to_fp16_palettized, x = input_547_cast_fp16)[name = tensor("linear_91_cast_fp16")]; tensor input_551_cast_fp16 = silu(x = linear_91_cast_fp16)[name = tensor("input_551_cast_fp16")]; tensor encoder_layers_10_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211740224))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214886016))), name = tensor("encoder_layers_10_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_10_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_10_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214886208)))]; tensor linear_92_cast_fp16 = linear(bias = encoder_layers_10_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_10_feed_forward1_linear2_weight_to_fp16_palettized, x = input_551_cast_fp16)[name = tensor("linear_92_cast_fp16")]; tensor var_2585_to_fp16 = const()[name = tensor("op_2585_to_fp16"), val = tensor(0x1p-1)]; tensor var_2586_cast_fp16 = mul(x = linear_92_cast_fp16, y = var_2585_to_fp16)[name = tensor("op_2586_cast_fp16")]; tensor input_557_cast_fp16 = add(x = input_545_cast_fp16, y = var_2586_cast_fp16)[name = tensor("input_557_cast_fp16")]; tensor key_21_axes_0 = const()[name = tensor("key_21_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_10_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214888320)))]; tensor encoder_layers_10_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_10_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214890432)))]; tensor key_21_cast_fp16 = layer_norm(axes = key_21_axes_0, beta = encoder_layers_10_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_10_norm_self_att_weight_to_fp16, x = input_557_cast_fp16)[name = tensor("key_21_cast_fp16")]; tensor input_559_interleave_0 = const()[name = tensor("input_559_interleave_0"), val = tensor(false)]; tensor input_559_cast_fp16 = concat(axis = var_68, interleave = input_559_interleave_0, values = (cache_41_cast_fp16, key_21_cast_fp16))[name = tensor("input_559_cast_fp16")]; tensor var_2608_begin_0 = const()[name = tensor("op_2608_begin_0"), val = tensor([0, 7, 0])]; tensor var_2608_end_0 = const()[name = tensor("op_2608_end_0"), val = tensor([1, 42, 1024])]; tensor var_2608_end_mask_0 = const()[name = tensor("op_2608_end_mask_0"), val = tensor([true, true, true])]; tensor var_2608_cast_fp16 = slice_by_index(begin = var_2608_begin_0, end = var_2608_end_0, end_mask = var_2608_end_mask_0, x = cache_41_cast_fp16)[name = tensor("op_2608_cast_fp16")]; tensor var_2614_interleave_0 = const()[name = tensor("op_2614_interleave_0"), val = tensor(false)]; tensor var_2614_cast_fp16 = concat(axis = var_68, interleave = var_2614_interleave_0, values = (var_2608_cast_fp16, key_21_cast_fp16))[name = tensor("op_2614_cast_fp16")]; tensor encoder_layers_10_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214892544))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215679040))), name = tensor("encoder_layers_10_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_10_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215679232)))]; tensor linear_93_cast_fp16 = linear(bias = encoder_layers_10_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_10_self_attn_linear_q_weight_to_fp16_palettized, x = key_21_cast_fp16)[name = tensor("linear_93_cast_fp16")]; tensor var_2619 = const()[name = tensor("op_2619"), val = tensor([1, -1, 8, 128])]; tensor q_61_cast_fp16 = reshape(shape = var_2619, x = linear_93_cast_fp16)[name = tensor("q_61_cast_fp16")]; tensor encoder_layers_10_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215681344))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(216467840))), name = tensor("encoder_layers_10_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_10_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(216468032)))]; tensor linear_94_cast_fp16 = linear(bias = encoder_layers_10_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_10_self_attn_linear_k_weight_to_fp16_palettized, x = input_559_cast_fp16)[name = tensor("linear_94_cast_fp16")]; tensor var_2624 = const()[name = tensor("op_2624"), val = tensor([1, -1, 8, 128])]; tensor k_41_cast_fp16 = reshape(shape = var_2624, x = linear_94_cast_fp16)[name = tensor("k_41_cast_fp16")]; tensor encoder_layers_10_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(216470144))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217256640))), name = tensor("encoder_layers_10_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_10_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217256832)))]; tensor linear_95_cast_fp16 = linear(bias = encoder_layers_10_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_10_self_attn_linear_v_weight_to_fp16_palettized, x = input_559_cast_fp16)[name = tensor("linear_95_cast_fp16")]; tensor var_2629 = const()[name = tensor("op_2629"), val = tensor([1, -1, 8, 128])]; tensor v_21_cast_fp16 = reshape(shape = var_2629, x = linear_95_cast_fp16)[name = tensor("v_21_cast_fp16")]; tensor value_29_perm_0 = const()[name = tensor("value_29_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_10_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217258944)))]; tensor var_2642_cast_fp16 = add(x = q_61_cast_fp16, y = encoder_layers_10_self_attn_pos_bias_u_to_fp16)[name = tensor("op_2642_cast_fp16")]; tensor encoder_layers_10_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217261056)))]; tensor var_2644_cast_fp16 = add(x = q_61_cast_fp16, y = encoder_layers_10_self_attn_pos_bias_v_to_fp16)[name = tensor("op_2644_cast_fp16")]; tensor q_with_bias_v_21_perm_0 = const()[name = tensor("q_with_bias_v_21_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_267_transpose_x_0 = const()[name = tensor("x_267_transpose_x_0"), val = tensor(false)]; tensor x_267_transpose_y_0 = const()[name = tensor("x_267_transpose_y_0"), val = tensor(false)]; tensor op_2646_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_2646_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217263168))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217362752))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217362560)))]; tensor q_with_bias_v_21_cast_fp16 = transpose(perm = q_with_bias_v_21_perm_0, x = var_2644_cast_fp16)[name = tensor("transpose_272")]; tensor x_267_cast_fp16 = matmul(transpose_x = x_267_transpose_x_0, transpose_y = x_267_transpose_y_0, x = q_with_bias_v_21_cast_fp16, y = op_2646_to_fp16_quantized)[name = tensor("x_267_cast_fp16")]; tensor x_269_pad_0 = const()[name = tensor("x_269_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_269_mode_0 = const()[name = tensor("x_269_mode_0"), val = tensor("constant")]; tensor const_209_to_fp16 = const()[name = tensor("const_209_to_fp16"), val = tensor(0x0p+0)]; tensor x_269_cast_fp16 = pad(constant_val = const_209_to_fp16, mode = x_269_mode_0, pad = x_269_pad_0, x = x_267_cast_fp16)[name = tensor("x_269_cast_fp16")]; tensor var_2654 = const()[name = tensor("op_2654"), val = tensor([1, 8, -1, 7])]; tensor x_271_cast_fp16 = reshape(shape = var_2654, x = x_269_cast_fp16)[name = tensor("x_271_cast_fp16")]; tensor var_2658_begin_0 = const()[name = tensor("op_2658_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_2658_end_0 = const()[name = tensor("op_2658_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_2658_end_mask_0 = const()[name = tensor("op_2658_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_2658_cast_fp16 = slice_by_index(begin = var_2658_begin_0, end = var_2658_end_0, end_mask = var_2658_end_mask_0, x = x_271_cast_fp16)[name = tensor("op_2658_cast_fp16")]; tensor var_2659 = const()[name = tensor("op_2659"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_41_cast_fp16 = reshape(shape = var_2659, x = var_2658_cast_fp16)[name = tensor("matrix_bd_41_cast_fp16")]; tensor matrix_ac_21_transpose_x_0 = const()[name = tensor("matrix_ac_21_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_21_transpose_y_0 = const()[name = tensor("matrix_ac_21_transpose_y_0"), val = tensor(false)]; tensor transpose_116_perm_0 = const()[name = tensor("transpose_116_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_117_perm_0 = const()[name = tensor("transpose_117_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_117 = transpose(perm = transpose_117_perm_0, x = k_41_cast_fp16)[name = tensor("transpose_270")]; tensor transpose_116 = transpose(perm = transpose_116_perm_0, x = var_2642_cast_fp16)[name = tensor("transpose_271")]; tensor matrix_ac_21_cast_fp16 = matmul(transpose_x = matrix_ac_21_transpose_x_0, transpose_y = matrix_ac_21_transpose_y_0, x = transpose_116, y = transpose_117)[name = tensor("matrix_ac_21_cast_fp16")]; tensor matrix_bd_43_begin_0 = const()[name = tensor("matrix_bd_43_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_43_end_0 = const()[name = tensor("matrix_bd_43_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_43_end_mask_0 = const()[name = tensor("matrix_bd_43_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_43_cast_fp16 = slice_by_index(begin = matrix_bd_43_begin_0, end = matrix_bd_43_end_0, end_mask = matrix_bd_43_end_mask_0, x = matrix_bd_41_cast_fp16)[name = tensor("matrix_bd_43_cast_fp16")]; tensor var_2668_cast_fp16 = add(x = matrix_ac_21_cast_fp16, y = matrix_bd_43_cast_fp16)[name = tensor("op_2668_cast_fp16")]; tensor _inversed_scores_41_y_0_to_fp16 = const()[name = tensor("_inversed_scores_41_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_41_cast_fp16 = mul(x = var_2668_cast_fp16, y = _inversed_scores_41_y_0_to_fp16)[name = tensor("_inversed_scores_41_cast_fp16")]; tensor scores_43_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_41_cast_fp16, cond = mask_11)[name = tensor("scores_43_cast_fp16")]; tensor var_2674_cast_fp16 = softmax(axis = var_59, x = scores_43_cast_fp16)[name = tensor("op_2674_cast_fp16")]; tensor input_561_cast_fp16 = select(a = var_44_to_fp16, b = var_2674_cast_fp16, cond = mask_11)[name = tensor("input_561_cast_fp16")]; tensor x_273_transpose_x_0 = const()[name = tensor("x_273_transpose_x_0"), val = tensor(false)]; tensor x_273_transpose_y_0 = const()[name = tensor("x_273_transpose_y_0"), val = tensor(false)]; tensor value_29_cast_fp16 = transpose(perm = value_29_perm_0, x = v_21_cast_fp16)[name = tensor("transpose_269")]; tensor x_273_cast_fp16 = matmul(transpose_x = x_273_transpose_x_0, transpose_y = x_273_transpose_y_0, x = input_561_cast_fp16, y = value_29_cast_fp16)[name = tensor("x_273_cast_fp16")]; tensor var_2678_perm_0 = const()[name = tensor("op_2678_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2679 = const()[name = tensor("op_2679"), val = tensor([1, -1, 1024])]; tensor var_2678_cast_fp16 = transpose(perm = var_2678_perm_0, x = x_273_cast_fp16)[name = tensor("transpose_268")]; tensor input_563_cast_fp16 = reshape(shape = var_2679, x = var_2678_cast_fp16)[name = tensor("input_563_cast_fp16")]; tensor encoder_layers_10_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217363072))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218149568))), name = tensor("encoder_layers_10_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_10_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218149760)))]; tensor linear_97_cast_fp16 = linear(bias = encoder_layers_10_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_10_self_attn_linear_out_weight_to_fp16_palettized, x = input_563_cast_fp16)[name = tensor("linear_97_cast_fp16")]; tensor input_567_cast_fp16 = add(x = input_557_cast_fp16, y = linear_97_cast_fp16)[name = tensor("input_567_cast_fp16")]; tensor x_277_axes_0 = const()[name = tensor("x_277_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_10_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218151872)))]; tensor encoder_layers_10_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_10_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218153984)))]; tensor x_277_cast_fp16 = layer_norm(axes = x_277_axes_0, beta = encoder_layers_10_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_10_norm_conv_weight_to_fp16, x = input_567_cast_fp16)[name = tensor("x_277_cast_fp16")]; tensor input_569_perm_0 = const()[name = tensor("input_569_perm_0"), val = tensor([0, 2, 1])]; tensor input_571_pad_type_0 = const()[name = tensor("input_571_pad_type_0"), val = tensor("valid")]; tensor input_571_strides_0 = const()[name = tensor("input_571_strides_0"), val = tensor([1])]; tensor input_571_pad_0 = const()[name = tensor("input_571_pad_0"), val = tensor([0, 0])]; tensor input_571_dilations_0 = const()[name = tensor("input_571_dilations_0"), val = tensor([1])]; tensor input_571_groups_0 = const()[name = tensor("input_571_groups_0"), val = tensor(1)]; tensor encoder_layers_10_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_10_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218156096))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220253312))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_569_cast_fp16 = transpose(perm = input_569_perm_0, x = x_277_cast_fp16)[name = tensor("transpose_267")]; tensor input_571_cast_fp16 = conv(dilations = input_571_dilations_0, groups = input_571_groups_0, pad = input_571_pad_0, pad_type = input_571_pad_type_0, strides = input_571_strides_0, weight = encoder_layers_10_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_569_cast_fp16)[name = tensor("input_571_cast_fp16")]; tensor x_279_split_num_splits_0 = const()[name = tensor("x_279_split_num_splits_0"), val = tensor(2)]; tensor x_279_split_axis_0 = const()[name = tensor("x_279_split_axis_0"), val = tensor(1)]; tensor x_279_split_cast_fp16_0, tensor x_279_split_cast_fp16_1 = split(axis = x_279_split_axis_0, num_splits = x_279_split_num_splits_0, x = input_571_cast_fp16)[name = tensor("x_279_split_cast_fp16")]; tensor x_279_split_1_sigmoid_cast_fp16 = sigmoid(x = x_279_split_cast_fp16_1)[name = tensor("x_279_split_1_sigmoid_cast_fp16")]; tensor x_279_cast_fp16 = mul(x = x_279_split_cast_fp16_0, y = x_279_split_1_sigmoid_cast_fp16)[name = tensor("x_279_cast_fp16")]; tensor input_573_cast_fp16 = select(a = var_44_to_fp16, b = x_279_cast_fp16, cond = var_575)[name = tensor("input_573_cast_fp16")]; tensor new_x_43_interleave_0 = const()[name = tensor("new_x_43_interleave_0"), val = tensor(false)]; tensor new_x_43_cast_fp16 = concat(axis = var_59, interleave = new_x_43_interleave_0, values = (cache_43_cast_fp16, input_573_cast_fp16))[name = tensor("new_x_43_cast_fp16")]; tensor var_2718_begin_0 = const()[name = tensor("op_2718_begin_0"), val = tensor([0, 0, 7])]; tensor var_2718_end_0 = const()[name = tensor("op_2718_end_0"), val = tensor([1, 1024, 15])]; tensor var_2718_end_mask_0 = const()[name = tensor("op_2718_end_mask_0"), val = tensor([true, true, true])]; tensor var_2718_cast_fp16 = slice_by_index(begin = var_2718_begin_0, end = var_2718_end_0, end_mask = var_2718_end_mask_0, x = new_x_43_cast_fp16)[name = tensor("op_2718_cast_fp16")]; tensor x_281_pad_type_0 = const()[name = tensor("x_281_pad_type_0"), val = tensor("valid")]; tensor x_281_groups_0 = const()[name = tensor("x_281_groups_0"), val = tensor(1024)]; tensor x_281_strides_0 = const()[name = tensor("x_281_strides_0"), val = tensor([1])]; tensor x_281_pad_0 = const()[name = tensor("x_281_pad_0"), val = tensor([0, 0])]; tensor x_281_dilations_0 = const()[name = tensor("x_281_dilations_0"), val = tensor([1])]; tensor encoder_layers_10_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_10_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220257472))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220266752))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_281_cast_fp16 = conv(dilations = x_281_dilations_0, groups = x_281_groups_0, pad = x_281_pad_0, pad_type = x_281_pad_type_0, strides = x_281_strides_0, weight = encoder_layers_10_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_43_cast_fp16)[name = tensor("x_281_cast_fp16")]; tensor input_575_perm_0 = const()[name = tensor("input_575_perm_0"), val = tensor([0, 2, 1])]; tensor x_283_axes_0 = const()[name = tensor("x_283_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_10_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220268864)))]; tensor encoder_layers_10_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_10_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220270976)))]; tensor input_575_cast_fp16 = transpose(perm = input_575_perm_0, x = x_281_cast_fp16)[name = tensor("transpose_266")]; tensor x_283_cast_fp16 = layer_norm(axes = x_283_axes_0, beta = encoder_layers_10_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_10_conv_batch_norm_weight_to_fp16, x = input_575_cast_fp16)[name = tensor("x_283_cast_fp16")]; tensor input_577_perm_0 = const()[name = tensor("input_577_perm_0"), val = tensor([0, 2, 1])]; tensor input_577_cast_fp16 = transpose(perm = input_577_perm_0, x = x_283_cast_fp16)[name = tensor("transpose_265")]; tensor input_579_cast_fp16 = silu(x = input_577_cast_fp16)[name = tensor("input_579_cast_fp16")]; tensor x_285_pad_type_0 = const()[name = tensor("x_285_pad_type_0"), val = tensor("valid")]; tensor x_285_strides_0 = const()[name = tensor("x_285_strides_0"), val = tensor([1])]; tensor x_285_pad_0 = const()[name = tensor("x_285_pad_0"), val = tensor([0, 0])]; tensor x_285_dilations_0 = const()[name = tensor("x_285_dilations_0"), val = tensor([1])]; tensor x_285_groups_0 = const()[name = tensor("x_285_groups_0"), val = tensor(1)]; tensor encoder_layers_10_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_10_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220273088))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(221321728))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_285_cast_fp16 = conv(dilations = x_285_dilations_0, groups = x_285_groups_0, pad = x_285_pad_0, pad_type = x_285_pad_type_0, strides = x_285_strides_0, weight = encoder_layers_10_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_579_cast_fp16)[name = tensor("x_285_cast_fp16")]; tensor input_581_perm_0 = const()[name = tensor("input_581_perm_0"), val = tensor([0, 2, 1])]; tensor input_581_cast_fp16 = transpose(perm = input_581_perm_0, x = x_285_cast_fp16)[name = tensor("transpose_264")]; tensor input_583_cast_fp16 = add(x = input_567_cast_fp16, y = input_581_cast_fp16)[name = tensor("input_583_cast_fp16")]; tensor input_585_axes_0 = const()[name = tensor("input_585_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_10_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(221323840)))]; tensor encoder_layers_10_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_10_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(221325952)))]; tensor input_585_cast_fp16 = layer_norm(axes = input_585_axes_0, beta = encoder_layers_10_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_10_norm_feed_forward2_weight_to_fp16, x = input_583_cast_fp16)[name = tensor("input_585_cast_fp16")]; tensor encoder_layers_10_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(221328064))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224473856))), name = tensor("encoder_layers_10_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_10_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_10_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224474048)))]; tensor linear_98_cast_fp16 = linear(bias = encoder_layers_10_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_10_feed_forward2_linear1_weight_to_fp16_palettized, x = input_585_cast_fp16)[name = tensor("linear_98_cast_fp16")]; tensor input_589_cast_fp16 = silu(x = linear_98_cast_fp16)[name = tensor("input_589_cast_fp16")]; tensor encoder_layers_10_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224482304))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(227628096))), name = tensor("encoder_layers_10_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_10_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_10_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(227628288)))]; tensor linear_99_cast_fp16 = linear(bias = encoder_layers_10_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_10_feed_forward2_linear2_weight_to_fp16_palettized, x = input_589_cast_fp16)[name = tensor("linear_99_cast_fp16")]; tensor var_2761_to_fp16 = const()[name = tensor("op_2761_to_fp16"), val = tensor(0x1p-1)]; tensor var_2762_cast_fp16 = mul(x = linear_99_cast_fp16, y = var_2761_to_fp16)[name = tensor("op_2762_cast_fp16")]; tensor input_595_cast_fp16 = add(x = input_583_cast_fp16, y = var_2762_cast_fp16)[name = tensor("input_595_cast_fp16")]; tensor input_597_axes_0 = const()[name = tensor("input_597_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_10_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(227630400)))]; tensor encoder_layers_10_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_10_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(227632512)))]; tensor input_597_cast_fp16 = layer_norm(axes = input_597_axes_0, beta = encoder_layers_10_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_10_norm_out_weight_to_fp16, x = input_595_cast_fp16)[name = tensor("input_597_cast_fp16")]; tensor cache_45_begin_0 = const()[name = tensor("cache_45_begin_0"), val = tensor([11, 0, 0, 0])]; tensor cache_45_end_0 = const()[name = tensor("cache_45_end_0"), val = tensor([12, 1, 42, 1024])]; tensor cache_45_end_mask_0 = const()[name = tensor("cache_45_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_45_squeeze_mask_0 = const()[name = tensor("cache_45_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_45_cast_fp16 = slice_by_index(begin = cache_45_begin_0, end = cache_45_end_0, end_mask = cache_45_end_mask_0, squeeze_mask = cache_45_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_45_cast_fp16")]; tensor cache_47_begin_0 = const()[name = tensor("cache_47_begin_0"), val = tensor([11, 0, 0, 0])]; tensor cache_47_end_0 = const()[name = tensor("cache_47_end_0"), val = tensor([12, 1, 1024, 8])]; tensor cache_47_end_mask_0 = const()[name = tensor("cache_47_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_47_squeeze_mask_0 = const()[name = tensor("cache_47_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_47_cast_fp16 = slice_by_index(begin = cache_47_begin_0, end = cache_47_end_0, end_mask = cache_47_end_mask_0, squeeze_mask = cache_47_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_47_cast_fp16")]; tensor input_599_axes_0 = const()[name = tensor("input_599_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_11_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(227634624)))]; tensor encoder_layers_11_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_11_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(227636736)))]; tensor input_599_cast_fp16 = layer_norm(axes = input_599_axes_0, beta = encoder_layers_11_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_11_norm_feed_forward1_weight_to_fp16, x = input_597_cast_fp16)[name = tensor("input_599_cast_fp16")]; tensor encoder_layers_11_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(227638848))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(230784640))), name = tensor("encoder_layers_11_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_11_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_11_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(230784832)))]; tensor linear_100_cast_fp16 = linear(bias = encoder_layers_11_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_11_feed_forward1_linear1_weight_to_fp16_palettized, x = input_599_cast_fp16)[name = tensor("linear_100_cast_fp16")]; tensor input_603_cast_fp16 = silu(x = linear_100_cast_fp16)[name = tensor("input_603_cast_fp16")]; tensor encoder_layers_11_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(230793088))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(233938880))), name = tensor("encoder_layers_11_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_11_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_11_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(233939072)))]; tensor linear_101_cast_fp16 = linear(bias = encoder_layers_11_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_11_feed_forward1_linear2_weight_to_fp16_palettized, x = input_603_cast_fp16)[name = tensor("linear_101_cast_fp16")]; tensor var_2798_to_fp16 = const()[name = tensor("op_2798_to_fp16"), val = tensor(0x1p-1)]; tensor var_2799_cast_fp16 = mul(x = linear_101_cast_fp16, y = var_2798_to_fp16)[name = tensor("op_2799_cast_fp16")]; tensor input_609_cast_fp16 = add(x = input_597_cast_fp16, y = var_2799_cast_fp16)[name = tensor("input_609_cast_fp16")]; tensor key_23_axes_0 = const()[name = tensor("key_23_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_11_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(233941184)))]; tensor encoder_layers_11_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_11_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(233943296)))]; tensor key_23_cast_fp16 = layer_norm(axes = key_23_axes_0, beta = encoder_layers_11_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_11_norm_self_att_weight_to_fp16, x = input_609_cast_fp16)[name = tensor("key_23_cast_fp16")]; tensor input_611_interleave_0 = const()[name = tensor("input_611_interleave_0"), val = tensor(false)]; tensor input_611_cast_fp16 = concat(axis = var_68, interleave = input_611_interleave_0, values = (cache_45_cast_fp16, key_23_cast_fp16))[name = tensor("input_611_cast_fp16")]; tensor var_2821_begin_0 = const()[name = tensor("op_2821_begin_0"), val = tensor([0, 7, 0])]; tensor var_2821_end_0 = const()[name = tensor("op_2821_end_0"), val = tensor([1, 42, 1024])]; tensor var_2821_end_mask_0 = const()[name = tensor("op_2821_end_mask_0"), val = tensor([true, true, true])]; tensor var_2821_cast_fp16 = slice_by_index(begin = var_2821_begin_0, end = var_2821_end_0, end_mask = var_2821_end_mask_0, x = cache_45_cast_fp16)[name = tensor("op_2821_cast_fp16")]; tensor var_2827_interleave_0 = const()[name = tensor("op_2827_interleave_0"), val = tensor(false)]; tensor var_2827_cast_fp16 = concat(axis = var_68, interleave = var_2827_interleave_0, values = (var_2821_cast_fp16, key_23_cast_fp16))[name = tensor("op_2827_cast_fp16")]; tensor encoder_layers_11_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(233945408))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(234731904))), name = tensor("encoder_layers_11_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_11_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(234732096)))]; tensor linear_102_cast_fp16 = linear(bias = encoder_layers_11_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_11_self_attn_linear_q_weight_to_fp16_palettized, x = key_23_cast_fp16)[name = tensor("linear_102_cast_fp16")]; tensor var_2832 = const()[name = tensor("op_2832"), val = tensor([1, -1, 8, 128])]; tensor q_67_cast_fp16 = reshape(shape = var_2832, x = linear_102_cast_fp16)[name = tensor("q_67_cast_fp16")]; tensor encoder_layers_11_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(234734208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(235520704))), name = tensor("encoder_layers_11_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_11_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(235520896)))]; tensor linear_103_cast_fp16 = linear(bias = encoder_layers_11_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_11_self_attn_linear_k_weight_to_fp16_palettized, x = input_611_cast_fp16)[name = tensor("linear_103_cast_fp16")]; tensor var_2837 = const()[name = tensor("op_2837"), val = tensor([1, -1, 8, 128])]; tensor k_45_cast_fp16 = reshape(shape = var_2837, x = linear_103_cast_fp16)[name = tensor("k_45_cast_fp16")]; tensor encoder_layers_11_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(235523008))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236309504))), name = tensor("encoder_layers_11_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_11_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236309696)))]; tensor linear_104_cast_fp16 = linear(bias = encoder_layers_11_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_11_self_attn_linear_v_weight_to_fp16_palettized, x = input_611_cast_fp16)[name = tensor("linear_104_cast_fp16")]; tensor var_2842 = const()[name = tensor("op_2842"), val = tensor([1, -1, 8, 128])]; tensor v_23_cast_fp16 = reshape(shape = var_2842, x = linear_104_cast_fp16)[name = tensor("v_23_cast_fp16")]; tensor value_31_perm_0 = const()[name = tensor("value_31_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_11_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236311808)))]; tensor var_2855_cast_fp16 = add(x = q_67_cast_fp16, y = encoder_layers_11_self_attn_pos_bias_u_to_fp16)[name = tensor("op_2855_cast_fp16")]; tensor encoder_layers_11_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236313920)))]; tensor var_2857_cast_fp16 = add(x = q_67_cast_fp16, y = encoder_layers_11_self_attn_pos_bias_v_to_fp16)[name = tensor("op_2857_cast_fp16")]; tensor q_with_bias_v_23_perm_0 = const()[name = tensor("q_with_bias_v_23_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_293_transpose_x_0 = const()[name = tensor("x_293_transpose_x_0"), val = tensor(false)]; tensor x_293_transpose_y_0 = const()[name = tensor("x_293_transpose_y_0"), val = tensor(false)]; tensor op_2859_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_2859_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236316032))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236415616))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236415424)))]; tensor q_with_bias_v_23_cast_fp16 = transpose(perm = q_with_bias_v_23_perm_0, x = var_2857_cast_fp16)[name = tensor("transpose_263")]; tensor x_293_cast_fp16 = matmul(transpose_x = x_293_transpose_x_0, transpose_y = x_293_transpose_y_0, x = q_with_bias_v_23_cast_fp16, y = op_2859_to_fp16_quantized)[name = tensor("x_293_cast_fp16")]; tensor x_295_pad_0 = const()[name = tensor("x_295_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_295_mode_0 = const()[name = tensor("x_295_mode_0"), val = tensor("constant")]; tensor const_222_to_fp16 = const()[name = tensor("const_222_to_fp16"), val = tensor(0x0p+0)]; tensor x_295_cast_fp16 = pad(constant_val = const_222_to_fp16, mode = x_295_mode_0, pad = x_295_pad_0, x = x_293_cast_fp16)[name = tensor("x_295_cast_fp16")]; tensor var_2867 = const()[name = tensor("op_2867"), val = tensor([1, 8, -1, 7])]; tensor x_297_cast_fp16 = reshape(shape = var_2867, x = x_295_cast_fp16)[name = tensor("x_297_cast_fp16")]; tensor var_2871_begin_0 = const()[name = tensor("op_2871_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_2871_end_0 = const()[name = tensor("op_2871_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_2871_end_mask_0 = const()[name = tensor("op_2871_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_2871_cast_fp16 = slice_by_index(begin = var_2871_begin_0, end = var_2871_end_0, end_mask = var_2871_end_mask_0, x = x_297_cast_fp16)[name = tensor("op_2871_cast_fp16")]; tensor var_2872 = const()[name = tensor("op_2872"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_45_cast_fp16 = reshape(shape = var_2872, x = var_2871_cast_fp16)[name = tensor("matrix_bd_45_cast_fp16")]; tensor matrix_ac_23_transpose_x_0 = const()[name = tensor("matrix_ac_23_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_23_transpose_y_0 = const()[name = tensor("matrix_ac_23_transpose_y_0"), val = tensor(false)]; tensor transpose_118_perm_0 = const()[name = tensor("transpose_118_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_119_perm_0 = const()[name = tensor("transpose_119_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_119 = transpose(perm = transpose_119_perm_0, x = k_45_cast_fp16)[name = tensor("transpose_261")]; tensor transpose_118 = transpose(perm = transpose_118_perm_0, x = var_2855_cast_fp16)[name = tensor("transpose_262")]; tensor matrix_ac_23_cast_fp16 = matmul(transpose_x = matrix_ac_23_transpose_x_0, transpose_y = matrix_ac_23_transpose_y_0, x = transpose_118, y = transpose_119)[name = tensor("matrix_ac_23_cast_fp16")]; tensor matrix_bd_47_begin_0 = const()[name = tensor("matrix_bd_47_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_47_end_0 = const()[name = tensor("matrix_bd_47_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_47_end_mask_0 = const()[name = tensor("matrix_bd_47_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_47_cast_fp16 = slice_by_index(begin = matrix_bd_47_begin_0, end = matrix_bd_47_end_0, end_mask = matrix_bd_47_end_mask_0, x = matrix_bd_45_cast_fp16)[name = tensor("matrix_bd_47_cast_fp16")]; tensor var_2881_cast_fp16 = add(x = matrix_ac_23_cast_fp16, y = matrix_bd_47_cast_fp16)[name = tensor("op_2881_cast_fp16")]; tensor _inversed_scores_45_y_0_to_fp16 = const()[name = tensor("_inversed_scores_45_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_45_cast_fp16 = mul(x = var_2881_cast_fp16, y = _inversed_scores_45_y_0_to_fp16)[name = tensor("_inversed_scores_45_cast_fp16")]; tensor scores_47_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_45_cast_fp16, cond = mask_11)[name = tensor("scores_47_cast_fp16")]; tensor var_2887_cast_fp16 = softmax(axis = var_59, x = scores_47_cast_fp16)[name = tensor("op_2887_cast_fp16")]; tensor input_613_cast_fp16 = select(a = var_44_to_fp16, b = var_2887_cast_fp16, cond = mask_11)[name = tensor("input_613_cast_fp16")]; tensor x_299_transpose_x_0 = const()[name = tensor("x_299_transpose_x_0"), val = tensor(false)]; tensor x_299_transpose_y_0 = const()[name = tensor("x_299_transpose_y_0"), val = tensor(false)]; tensor value_31_cast_fp16 = transpose(perm = value_31_perm_0, x = v_23_cast_fp16)[name = tensor("transpose_260")]; tensor x_299_cast_fp16 = matmul(transpose_x = x_299_transpose_x_0, transpose_y = x_299_transpose_y_0, x = input_613_cast_fp16, y = value_31_cast_fp16)[name = tensor("x_299_cast_fp16")]; tensor var_2891_perm_0 = const()[name = tensor("op_2891_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2892 = const()[name = tensor("op_2892"), val = tensor([1, -1, 1024])]; tensor var_2891_cast_fp16 = transpose(perm = var_2891_perm_0, x = x_299_cast_fp16)[name = tensor("transpose_259")]; tensor input_615_cast_fp16 = reshape(shape = var_2892, x = var_2891_cast_fp16)[name = tensor("input_615_cast_fp16")]; tensor encoder_layers_11_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236415936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237202432))), name = tensor("encoder_layers_11_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_11_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237202624)))]; tensor linear_106_cast_fp16 = linear(bias = encoder_layers_11_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_11_self_attn_linear_out_weight_to_fp16_palettized, x = input_615_cast_fp16)[name = tensor("linear_106_cast_fp16")]; tensor input_619_cast_fp16 = add(x = input_609_cast_fp16, y = linear_106_cast_fp16)[name = tensor("input_619_cast_fp16")]; tensor x_303_axes_0 = const()[name = tensor("x_303_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_11_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237204736)))]; tensor encoder_layers_11_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_11_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237206848)))]; tensor x_303_cast_fp16 = layer_norm(axes = x_303_axes_0, beta = encoder_layers_11_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_11_norm_conv_weight_to_fp16, x = input_619_cast_fp16)[name = tensor("x_303_cast_fp16")]; tensor input_621_perm_0 = const()[name = tensor("input_621_perm_0"), val = tensor([0, 2, 1])]; tensor input_623_pad_type_0 = const()[name = tensor("input_623_pad_type_0"), val = tensor("valid")]; tensor input_623_strides_0 = const()[name = tensor("input_623_strides_0"), val = tensor([1])]; tensor input_623_pad_0 = const()[name = tensor("input_623_pad_0"), val = tensor([0, 0])]; tensor input_623_dilations_0 = const()[name = tensor("input_623_dilations_0"), val = tensor([1])]; tensor input_623_groups_0 = const()[name = tensor("input_623_groups_0"), val = tensor(1)]; tensor encoder_layers_11_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_11_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237208960))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(239306176))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_621_cast_fp16 = transpose(perm = input_621_perm_0, x = x_303_cast_fp16)[name = tensor("transpose_258")]; tensor input_623_cast_fp16 = conv(dilations = input_623_dilations_0, groups = input_623_groups_0, pad = input_623_pad_0, pad_type = input_623_pad_type_0, strides = input_623_strides_0, weight = encoder_layers_11_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_621_cast_fp16)[name = tensor("input_623_cast_fp16")]; tensor x_305_split_num_splits_0 = const()[name = tensor("x_305_split_num_splits_0"), val = tensor(2)]; tensor x_305_split_axis_0 = const()[name = tensor("x_305_split_axis_0"), val = tensor(1)]; tensor x_305_split_cast_fp16_0, tensor x_305_split_cast_fp16_1 = split(axis = x_305_split_axis_0, num_splits = x_305_split_num_splits_0, x = input_623_cast_fp16)[name = tensor("x_305_split_cast_fp16")]; tensor x_305_split_1_sigmoid_cast_fp16 = sigmoid(x = x_305_split_cast_fp16_1)[name = tensor("x_305_split_1_sigmoid_cast_fp16")]; tensor x_305_cast_fp16 = mul(x = x_305_split_cast_fp16_0, y = x_305_split_1_sigmoid_cast_fp16)[name = tensor("x_305_cast_fp16")]; tensor input_625_cast_fp16 = select(a = var_44_to_fp16, b = x_305_cast_fp16, cond = var_575)[name = tensor("input_625_cast_fp16")]; tensor new_x_47_interleave_0 = const()[name = tensor("new_x_47_interleave_0"), val = tensor(false)]; tensor new_x_47_cast_fp16 = concat(axis = var_59, interleave = new_x_47_interleave_0, values = (cache_47_cast_fp16, input_625_cast_fp16))[name = tensor("new_x_47_cast_fp16")]; tensor var_2931_begin_0 = const()[name = tensor("op_2931_begin_0"), val = tensor([0, 0, 7])]; tensor var_2931_end_0 = const()[name = tensor("op_2931_end_0"), val = tensor([1, 1024, 15])]; tensor var_2931_end_mask_0 = const()[name = tensor("op_2931_end_mask_0"), val = tensor([true, true, true])]; tensor var_2931_cast_fp16 = slice_by_index(begin = var_2931_begin_0, end = var_2931_end_0, end_mask = var_2931_end_mask_0, x = new_x_47_cast_fp16)[name = tensor("op_2931_cast_fp16")]; tensor x_307_pad_type_0 = const()[name = tensor("x_307_pad_type_0"), val = tensor("valid")]; tensor x_307_groups_0 = const()[name = tensor("x_307_groups_0"), val = tensor(1024)]; tensor x_307_strides_0 = const()[name = tensor("x_307_strides_0"), val = tensor([1])]; tensor x_307_pad_0 = const()[name = tensor("x_307_pad_0"), val = tensor([0, 0])]; tensor x_307_dilations_0 = const()[name = tensor("x_307_dilations_0"), val = tensor([1])]; tensor encoder_layers_11_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_11_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(239310336))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(239319616))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_307_cast_fp16 = conv(dilations = x_307_dilations_0, groups = x_307_groups_0, pad = x_307_pad_0, pad_type = x_307_pad_type_0, strides = x_307_strides_0, weight = encoder_layers_11_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_47_cast_fp16)[name = tensor("x_307_cast_fp16")]; tensor input_627_perm_0 = const()[name = tensor("input_627_perm_0"), val = tensor([0, 2, 1])]; tensor x_309_axes_0 = const()[name = tensor("x_309_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_11_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(239321728)))]; tensor encoder_layers_11_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_11_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(239323840)))]; tensor input_627_cast_fp16 = transpose(perm = input_627_perm_0, x = x_307_cast_fp16)[name = tensor("transpose_257")]; tensor x_309_cast_fp16 = layer_norm(axes = x_309_axes_0, beta = encoder_layers_11_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_11_conv_batch_norm_weight_to_fp16, x = input_627_cast_fp16)[name = tensor("x_309_cast_fp16")]; tensor input_629_perm_0 = const()[name = tensor("input_629_perm_0"), val = tensor([0, 2, 1])]; tensor input_629_cast_fp16 = transpose(perm = input_629_perm_0, x = x_309_cast_fp16)[name = tensor("transpose_256")]; tensor input_631_cast_fp16 = silu(x = input_629_cast_fp16)[name = tensor("input_631_cast_fp16")]; tensor x_311_pad_type_0 = const()[name = tensor("x_311_pad_type_0"), val = tensor("valid")]; tensor x_311_strides_0 = const()[name = tensor("x_311_strides_0"), val = tensor([1])]; tensor x_311_pad_0 = const()[name = tensor("x_311_pad_0"), val = tensor([0, 0])]; tensor x_311_dilations_0 = const()[name = tensor("x_311_dilations_0"), val = tensor([1])]; tensor x_311_groups_0 = const()[name = tensor("x_311_groups_0"), val = tensor(1)]; tensor encoder_layers_11_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_11_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(239325952))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240374592))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_311_cast_fp16 = conv(dilations = x_311_dilations_0, groups = x_311_groups_0, pad = x_311_pad_0, pad_type = x_311_pad_type_0, strides = x_311_strides_0, weight = encoder_layers_11_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_631_cast_fp16)[name = tensor("x_311_cast_fp16")]; tensor input_633_perm_0 = const()[name = tensor("input_633_perm_0"), val = tensor([0, 2, 1])]; tensor input_633_cast_fp16 = transpose(perm = input_633_perm_0, x = x_311_cast_fp16)[name = tensor("transpose_255")]; tensor input_635_cast_fp16 = add(x = input_619_cast_fp16, y = input_633_cast_fp16)[name = tensor("input_635_cast_fp16")]; tensor input_637_axes_0 = const()[name = tensor("input_637_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_11_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240376704)))]; tensor encoder_layers_11_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_11_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240378816)))]; tensor input_637_cast_fp16 = layer_norm(axes = input_637_axes_0, beta = encoder_layers_11_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_11_norm_feed_forward2_weight_to_fp16, x = input_635_cast_fp16)[name = tensor("input_637_cast_fp16")]; tensor encoder_layers_11_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240380928))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(243526720))), name = tensor("encoder_layers_11_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_11_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_11_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(243526912)))]; tensor linear_107_cast_fp16 = linear(bias = encoder_layers_11_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_11_feed_forward2_linear1_weight_to_fp16_palettized, x = input_637_cast_fp16)[name = tensor("linear_107_cast_fp16")]; tensor input_641_cast_fp16 = silu(x = linear_107_cast_fp16)[name = tensor("input_641_cast_fp16")]; tensor encoder_layers_11_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(243535168))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246680960))), name = tensor("encoder_layers_11_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_11_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_11_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246681152)))]; tensor linear_108_cast_fp16 = linear(bias = encoder_layers_11_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_11_feed_forward2_linear2_weight_to_fp16_palettized, x = input_641_cast_fp16)[name = tensor("linear_108_cast_fp16")]; tensor var_2974_to_fp16 = const()[name = tensor("op_2974_to_fp16"), val = tensor(0x1p-1)]; tensor var_2975_cast_fp16 = mul(x = linear_108_cast_fp16, y = var_2974_to_fp16)[name = tensor("op_2975_cast_fp16")]; tensor input_647_cast_fp16 = add(x = input_635_cast_fp16, y = var_2975_cast_fp16)[name = tensor("input_647_cast_fp16")]; tensor input_649_axes_0 = const()[name = tensor("input_649_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_11_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246683264)))]; tensor encoder_layers_11_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_11_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246685376)))]; tensor input_649_cast_fp16 = layer_norm(axes = input_649_axes_0, beta = encoder_layers_11_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_11_norm_out_weight_to_fp16, x = input_647_cast_fp16)[name = tensor("input_649_cast_fp16")]; tensor cache_49_begin_0 = const()[name = tensor("cache_49_begin_0"), val = tensor([12, 0, 0, 0])]; tensor cache_49_end_0 = const()[name = tensor("cache_49_end_0"), val = tensor([13, 1, 42, 1024])]; tensor cache_49_end_mask_0 = const()[name = tensor("cache_49_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_49_squeeze_mask_0 = const()[name = tensor("cache_49_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_49_cast_fp16 = slice_by_index(begin = cache_49_begin_0, end = cache_49_end_0, end_mask = cache_49_end_mask_0, squeeze_mask = cache_49_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_49_cast_fp16")]; tensor cache_51_begin_0 = const()[name = tensor("cache_51_begin_0"), val = tensor([12, 0, 0, 0])]; tensor cache_51_end_0 = const()[name = tensor("cache_51_end_0"), val = tensor([13, 1, 1024, 8])]; tensor cache_51_end_mask_0 = const()[name = tensor("cache_51_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_51_squeeze_mask_0 = const()[name = tensor("cache_51_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_51_cast_fp16 = slice_by_index(begin = cache_51_begin_0, end = cache_51_end_0, end_mask = cache_51_end_mask_0, squeeze_mask = cache_51_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_51_cast_fp16")]; tensor input_651_axes_0 = const()[name = tensor("input_651_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_12_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246687488)))]; tensor encoder_layers_12_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_12_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246689600)))]; tensor input_651_cast_fp16 = layer_norm(axes = input_651_axes_0, beta = encoder_layers_12_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_12_norm_feed_forward1_weight_to_fp16, x = input_649_cast_fp16)[name = tensor("input_651_cast_fp16")]; tensor encoder_layers_12_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246691712))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(249837504))), name = tensor("encoder_layers_12_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_12_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_12_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(249837696)))]; tensor linear_109_cast_fp16 = linear(bias = encoder_layers_12_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_12_feed_forward1_linear1_weight_to_fp16_palettized, x = input_651_cast_fp16)[name = tensor("linear_109_cast_fp16")]; tensor input_655_cast_fp16 = silu(x = linear_109_cast_fp16)[name = tensor("input_655_cast_fp16")]; tensor encoder_layers_12_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(249845952))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(252991744))), name = tensor("encoder_layers_12_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_12_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_12_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(252991936)))]; tensor linear_110_cast_fp16 = linear(bias = encoder_layers_12_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_12_feed_forward1_linear2_weight_to_fp16_palettized, x = input_655_cast_fp16)[name = tensor("linear_110_cast_fp16")]; tensor var_3011_to_fp16 = const()[name = tensor("op_3011_to_fp16"), val = tensor(0x1p-1)]; tensor var_3012_cast_fp16 = mul(x = linear_110_cast_fp16, y = var_3011_to_fp16)[name = tensor("op_3012_cast_fp16")]; tensor input_661_cast_fp16 = add(x = input_649_cast_fp16, y = var_3012_cast_fp16)[name = tensor("input_661_cast_fp16")]; tensor key_25_axes_0 = const()[name = tensor("key_25_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_12_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(252994048)))]; tensor encoder_layers_12_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_12_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(252996160)))]; tensor key_25_cast_fp16 = layer_norm(axes = key_25_axes_0, beta = encoder_layers_12_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_12_norm_self_att_weight_to_fp16, x = input_661_cast_fp16)[name = tensor("key_25_cast_fp16")]; tensor input_663_interleave_0 = const()[name = tensor("input_663_interleave_0"), val = tensor(false)]; tensor input_663_cast_fp16 = concat(axis = var_68, interleave = input_663_interleave_0, values = (cache_49_cast_fp16, key_25_cast_fp16))[name = tensor("input_663_cast_fp16")]; tensor var_3034_begin_0 = const()[name = tensor("op_3034_begin_0"), val = tensor([0, 7, 0])]; tensor var_3034_end_0 = const()[name = tensor("op_3034_end_0"), val = tensor([1, 42, 1024])]; tensor var_3034_end_mask_0 = const()[name = tensor("op_3034_end_mask_0"), val = tensor([true, true, true])]; tensor var_3034_cast_fp16 = slice_by_index(begin = var_3034_begin_0, end = var_3034_end_0, end_mask = var_3034_end_mask_0, x = cache_49_cast_fp16)[name = tensor("op_3034_cast_fp16")]; tensor var_3040_interleave_0 = const()[name = tensor("op_3040_interleave_0"), val = tensor(false)]; tensor var_3040_cast_fp16 = concat(axis = var_68, interleave = var_3040_interleave_0, values = (var_3034_cast_fp16, key_25_cast_fp16))[name = tensor("op_3040_cast_fp16")]; tensor encoder_layers_12_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(252998272))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253784768))), name = tensor("encoder_layers_12_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_12_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253784960)))]; tensor linear_111_cast_fp16 = linear(bias = encoder_layers_12_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_12_self_attn_linear_q_weight_to_fp16_palettized, x = key_25_cast_fp16)[name = tensor("linear_111_cast_fp16")]; tensor var_3045 = const()[name = tensor("op_3045"), val = tensor([1, -1, 8, 128])]; tensor q_73_cast_fp16 = reshape(shape = var_3045, x = linear_111_cast_fp16)[name = tensor("q_73_cast_fp16")]; tensor encoder_layers_12_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253787072))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254573568))), name = tensor("encoder_layers_12_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_12_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254573760)))]; tensor linear_112_cast_fp16 = linear(bias = encoder_layers_12_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_12_self_attn_linear_k_weight_to_fp16_palettized, x = input_663_cast_fp16)[name = tensor("linear_112_cast_fp16")]; tensor var_3050 = const()[name = tensor("op_3050"), val = tensor([1, -1, 8, 128])]; tensor k_49_cast_fp16 = reshape(shape = var_3050, x = linear_112_cast_fp16)[name = tensor("k_49_cast_fp16")]; tensor encoder_layers_12_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254575872))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255362368))), name = tensor("encoder_layers_12_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_12_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255362560)))]; tensor linear_113_cast_fp16 = linear(bias = encoder_layers_12_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_12_self_attn_linear_v_weight_to_fp16_palettized, x = input_663_cast_fp16)[name = tensor("linear_113_cast_fp16")]; tensor var_3055 = const()[name = tensor("op_3055"), val = tensor([1, -1, 8, 128])]; tensor v_25_cast_fp16 = reshape(shape = var_3055, x = linear_113_cast_fp16)[name = tensor("v_25_cast_fp16")]; tensor value_33_perm_0 = const()[name = tensor("value_33_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_12_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255364672)))]; tensor var_3068_cast_fp16 = add(x = q_73_cast_fp16, y = encoder_layers_12_self_attn_pos_bias_u_to_fp16)[name = tensor("op_3068_cast_fp16")]; tensor encoder_layers_12_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255366784)))]; tensor var_3070_cast_fp16 = add(x = q_73_cast_fp16, y = encoder_layers_12_self_attn_pos_bias_v_to_fp16)[name = tensor("op_3070_cast_fp16")]; tensor q_with_bias_v_25_perm_0 = const()[name = tensor("q_with_bias_v_25_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_319_transpose_x_0 = const()[name = tensor("x_319_transpose_x_0"), val = tensor(false)]; tensor x_319_transpose_y_0 = const()[name = tensor("x_319_transpose_y_0"), val = tensor(false)]; tensor op_3072_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_3072_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255368896))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255468480))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255468288)))]; tensor q_with_bias_v_25_cast_fp16 = transpose(perm = q_with_bias_v_25_perm_0, x = var_3070_cast_fp16)[name = tensor("transpose_254")]; tensor x_319_cast_fp16 = matmul(transpose_x = x_319_transpose_x_0, transpose_y = x_319_transpose_y_0, x = q_with_bias_v_25_cast_fp16, y = op_3072_to_fp16_quantized)[name = tensor("x_319_cast_fp16")]; tensor x_321_pad_0 = const()[name = tensor("x_321_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_321_mode_0 = const()[name = tensor("x_321_mode_0"), val = tensor("constant")]; tensor const_235_to_fp16 = const()[name = tensor("const_235_to_fp16"), val = tensor(0x0p+0)]; tensor x_321_cast_fp16 = pad(constant_val = const_235_to_fp16, mode = x_321_mode_0, pad = x_321_pad_0, x = x_319_cast_fp16)[name = tensor("x_321_cast_fp16")]; tensor var_3080 = const()[name = tensor("op_3080"), val = tensor([1, 8, -1, 7])]; tensor x_323_cast_fp16 = reshape(shape = var_3080, x = x_321_cast_fp16)[name = tensor("x_323_cast_fp16")]; tensor var_3084_begin_0 = const()[name = tensor("op_3084_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_3084_end_0 = const()[name = tensor("op_3084_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_3084_end_mask_0 = const()[name = tensor("op_3084_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_3084_cast_fp16 = slice_by_index(begin = var_3084_begin_0, end = var_3084_end_0, end_mask = var_3084_end_mask_0, x = x_323_cast_fp16)[name = tensor("op_3084_cast_fp16")]; tensor var_3085 = const()[name = tensor("op_3085"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_49_cast_fp16 = reshape(shape = var_3085, x = var_3084_cast_fp16)[name = tensor("matrix_bd_49_cast_fp16")]; tensor matrix_ac_25_transpose_x_0 = const()[name = tensor("matrix_ac_25_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_25_transpose_y_0 = const()[name = tensor("matrix_ac_25_transpose_y_0"), val = tensor(false)]; tensor transpose_120_perm_0 = const()[name = tensor("transpose_120_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_121_perm_0 = const()[name = tensor("transpose_121_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_121 = transpose(perm = transpose_121_perm_0, x = k_49_cast_fp16)[name = tensor("transpose_252")]; tensor transpose_120 = transpose(perm = transpose_120_perm_0, x = var_3068_cast_fp16)[name = tensor("transpose_253")]; tensor matrix_ac_25_cast_fp16 = matmul(transpose_x = matrix_ac_25_transpose_x_0, transpose_y = matrix_ac_25_transpose_y_0, x = transpose_120, y = transpose_121)[name = tensor("matrix_ac_25_cast_fp16")]; tensor matrix_bd_51_begin_0 = const()[name = tensor("matrix_bd_51_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_51_end_0 = const()[name = tensor("matrix_bd_51_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_51_end_mask_0 = const()[name = tensor("matrix_bd_51_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_51_cast_fp16 = slice_by_index(begin = matrix_bd_51_begin_0, end = matrix_bd_51_end_0, end_mask = matrix_bd_51_end_mask_0, x = matrix_bd_49_cast_fp16)[name = tensor("matrix_bd_51_cast_fp16")]; tensor var_3094_cast_fp16 = add(x = matrix_ac_25_cast_fp16, y = matrix_bd_51_cast_fp16)[name = tensor("op_3094_cast_fp16")]; tensor _inversed_scores_49_y_0_to_fp16 = const()[name = tensor("_inversed_scores_49_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_49_cast_fp16 = mul(x = var_3094_cast_fp16, y = _inversed_scores_49_y_0_to_fp16)[name = tensor("_inversed_scores_49_cast_fp16")]; tensor scores_51_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_49_cast_fp16, cond = mask_11)[name = tensor("scores_51_cast_fp16")]; tensor var_3100_cast_fp16 = softmax(axis = var_59, x = scores_51_cast_fp16)[name = tensor("op_3100_cast_fp16")]; tensor input_665_cast_fp16 = select(a = var_44_to_fp16, b = var_3100_cast_fp16, cond = mask_11)[name = tensor("input_665_cast_fp16")]; tensor x_325_transpose_x_0 = const()[name = tensor("x_325_transpose_x_0"), val = tensor(false)]; tensor x_325_transpose_y_0 = const()[name = tensor("x_325_transpose_y_0"), val = tensor(false)]; tensor value_33_cast_fp16 = transpose(perm = value_33_perm_0, x = v_25_cast_fp16)[name = tensor("transpose_251")]; tensor x_325_cast_fp16 = matmul(transpose_x = x_325_transpose_x_0, transpose_y = x_325_transpose_y_0, x = input_665_cast_fp16, y = value_33_cast_fp16)[name = tensor("x_325_cast_fp16")]; tensor var_3104_perm_0 = const()[name = tensor("op_3104_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3105 = const()[name = tensor("op_3105"), val = tensor([1, -1, 1024])]; tensor var_3104_cast_fp16 = transpose(perm = var_3104_perm_0, x = x_325_cast_fp16)[name = tensor("transpose_250")]; tensor input_667_cast_fp16 = reshape(shape = var_3105, x = var_3104_cast_fp16)[name = tensor("input_667_cast_fp16")]; tensor encoder_layers_12_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255468800))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256255296))), name = tensor("encoder_layers_12_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_12_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256255488)))]; tensor linear_115_cast_fp16 = linear(bias = encoder_layers_12_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_12_self_attn_linear_out_weight_to_fp16_palettized, x = input_667_cast_fp16)[name = tensor("linear_115_cast_fp16")]; tensor input_671_cast_fp16 = add(x = input_661_cast_fp16, y = linear_115_cast_fp16)[name = tensor("input_671_cast_fp16")]; tensor x_329_axes_0 = const()[name = tensor("x_329_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_12_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256257600)))]; tensor encoder_layers_12_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_12_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256259712)))]; tensor x_329_cast_fp16 = layer_norm(axes = x_329_axes_0, beta = encoder_layers_12_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_12_norm_conv_weight_to_fp16, x = input_671_cast_fp16)[name = tensor("x_329_cast_fp16")]; tensor input_673_perm_0 = const()[name = tensor("input_673_perm_0"), val = tensor([0, 2, 1])]; tensor input_675_pad_type_0 = const()[name = tensor("input_675_pad_type_0"), val = tensor("valid")]; tensor input_675_strides_0 = const()[name = tensor("input_675_strides_0"), val = tensor([1])]; tensor input_675_pad_0 = const()[name = tensor("input_675_pad_0"), val = tensor([0, 0])]; tensor input_675_dilations_0 = const()[name = tensor("input_675_dilations_0"), val = tensor([1])]; tensor input_675_groups_0 = const()[name = tensor("input_675_groups_0"), val = tensor(1)]; tensor encoder_layers_12_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_12_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256261824))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(258359040))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_673_cast_fp16 = transpose(perm = input_673_perm_0, x = x_329_cast_fp16)[name = tensor("transpose_249")]; tensor input_675_cast_fp16 = conv(dilations = input_675_dilations_0, groups = input_675_groups_0, pad = input_675_pad_0, pad_type = input_675_pad_type_0, strides = input_675_strides_0, weight = encoder_layers_12_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_673_cast_fp16)[name = tensor("input_675_cast_fp16")]; tensor x_331_split_num_splits_0 = const()[name = tensor("x_331_split_num_splits_0"), val = tensor(2)]; tensor x_331_split_axis_0 = const()[name = tensor("x_331_split_axis_0"), val = tensor(1)]; tensor x_331_split_cast_fp16_0, tensor x_331_split_cast_fp16_1 = split(axis = x_331_split_axis_0, num_splits = x_331_split_num_splits_0, x = input_675_cast_fp16)[name = tensor("x_331_split_cast_fp16")]; tensor x_331_split_1_sigmoid_cast_fp16 = sigmoid(x = x_331_split_cast_fp16_1)[name = tensor("x_331_split_1_sigmoid_cast_fp16")]; tensor x_331_cast_fp16 = mul(x = x_331_split_cast_fp16_0, y = x_331_split_1_sigmoid_cast_fp16)[name = tensor("x_331_cast_fp16")]; tensor input_677_cast_fp16 = select(a = var_44_to_fp16, b = x_331_cast_fp16, cond = var_575)[name = tensor("input_677_cast_fp16")]; tensor new_x_51_interleave_0 = const()[name = tensor("new_x_51_interleave_0"), val = tensor(false)]; tensor new_x_51_cast_fp16 = concat(axis = var_59, interleave = new_x_51_interleave_0, values = (cache_51_cast_fp16, input_677_cast_fp16))[name = tensor("new_x_51_cast_fp16")]; tensor var_3144_begin_0 = const()[name = tensor("op_3144_begin_0"), val = tensor([0, 0, 7])]; tensor var_3144_end_0 = const()[name = tensor("op_3144_end_0"), val = tensor([1, 1024, 15])]; tensor var_3144_end_mask_0 = const()[name = tensor("op_3144_end_mask_0"), val = tensor([true, true, true])]; tensor var_3144_cast_fp16 = slice_by_index(begin = var_3144_begin_0, end = var_3144_end_0, end_mask = var_3144_end_mask_0, x = new_x_51_cast_fp16)[name = tensor("op_3144_cast_fp16")]; tensor x_333_pad_type_0 = const()[name = tensor("x_333_pad_type_0"), val = tensor("valid")]; tensor x_333_groups_0 = const()[name = tensor("x_333_groups_0"), val = tensor(1024)]; tensor x_333_strides_0 = const()[name = tensor("x_333_strides_0"), val = tensor([1])]; tensor x_333_pad_0 = const()[name = tensor("x_333_pad_0"), val = tensor([0, 0])]; tensor x_333_dilations_0 = const()[name = tensor("x_333_dilations_0"), val = tensor([1])]; tensor encoder_layers_12_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_12_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(258363200))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(258372480))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_333_cast_fp16 = conv(dilations = x_333_dilations_0, groups = x_333_groups_0, pad = x_333_pad_0, pad_type = x_333_pad_type_0, strides = x_333_strides_0, weight = encoder_layers_12_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_51_cast_fp16)[name = tensor("x_333_cast_fp16")]; tensor input_679_perm_0 = const()[name = tensor("input_679_perm_0"), val = tensor([0, 2, 1])]; tensor x_335_axes_0 = const()[name = tensor("x_335_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_12_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(258374592)))]; tensor encoder_layers_12_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_12_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(258376704)))]; tensor input_679_cast_fp16 = transpose(perm = input_679_perm_0, x = x_333_cast_fp16)[name = tensor("transpose_248")]; tensor x_335_cast_fp16 = layer_norm(axes = x_335_axes_0, beta = encoder_layers_12_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_12_conv_batch_norm_weight_to_fp16, x = input_679_cast_fp16)[name = tensor("x_335_cast_fp16")]; tensor input_681_perm_0 = const()[name = tensor("input_681_perm_0"), val = tensor([0, 2, 1])]; tensor input_681_cast_fp16 = transpose(perm = input_681_perm_0, x = x_335_cast_fp16)[name = tensor("transpose_247")]; tensor input_683_cast_fp16 = silu(x = input_681_cast_fp16)[name = tensor("input_683_cast_fp16")]; tensor x_337_pad_type_0 = const()[name = tensor("x_337_pad_type_0"), val = tensor("valid")]; tensor x_337_strides_0 = const()[name = tensor("x_337_strides_0"), val = tensor([1])]; tensor x_337_pad_0 = const()[name = tensor("x_337_pad_0"), val = tensor([0, 0])]; tensor x_337_dilations_0 = const()[name = tensor("x_337_dilations_0"), val = tensor([1])]; tensor x_337_groups_0 = const()[name = tensor("x_337_groups_0"), val = tensor(1)]; tensor encoder_layers_12_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_12_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(258378816))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259427456))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_337_cast_fp16 = conv(dilations = x_337_dilations_0, groups = x_337_groups_0, pad = x_337_pad_0, pad_type = x_337_pad_type_0, strides = x_337_strides_0, weight = encoder_layers_12_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_683_cast_fp16)[name = tensor("x_337_cast_fp16")]; tensor input_685_perm_0 = const()[name = tensor("input_685_perm_0"), val = tensor([0, 2, 1])]; tensor input_685_cast_fp16 = transpose(perm = input_685_perm_0, x = x_337_cast_fp16)[name = tensor("transpose_246")]; tensor input_687_cast_fp16 = add(x = input_671_cast_fp16, y = input_685_cast_fp16)[name = tensor("input_687_cast_fp16")]; tensor input_689_axes_0 = const()[name = tensor("input_689_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_12_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259429568)))]; tensor encoder_layers_12_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_12_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259431680)))]; tensor input_689_cast_fp16 = layer_norm(axes = input_689_axes_0, beta = encoder_layers_12_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_12_norm_feed_forward2_weight_to_fp16, x = input_687_cast_fp16)[name = tensor("input_689_cast_fp16")]; tensor encoder_layers_12_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259433792))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(262579584))), name = tensor("encoder_layers_12_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_12_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_12_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(262579776)))]; tensor linear_116_cast_fp16 = linear(bias = encoder_layers_12_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_12_feed_forward2_linear1_weight_to_fp16_palettized, x = input_689_cast_fp16)[name = tensor("linear_116_cast_fp16")]; tensor input_693_cast_fp16 = silu(x = linear_116_cast_fp16)[name = tensor("input_693_cast_fp16")]; tensor encoder_layers_12_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(262588032))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265733824))), name = tensor("encoder_layers_12_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_12_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_12_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265734016)))]; tensor linear_117_cast_fp16 = linear(bias = encoder_layers_12_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_12_feed_forward2_linear2_weight_to_fp16_palettized, x = input_693_cast_fp16)[name = tensor("linear_117_cast_fp16")]; tensor var_3187_to_fp16 = const()[name = tensor("op_3187_to_fp16"), val = tensor(0x1p-1)]; tensor var_3188_cast_fp16 = mul(x = linear_117_cast_fp16, y = var_3187_to_fp16)[name = tensor("op_3188_cast_fp16")]; tensor input_699_cast_fp16 = add(x = input_687_cast_fp16, y = var_3188_cast_fp16)[name = tensor("input_699_cast_fp16")]; tensor input_701_axes_0 = const()[name = tensor("input_701_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_12_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265736128)))]; tensor encoder_layers_12_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_12_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265738240)))]; tensor input_701_cast_fp16 = layer_norm(axes = input_701_axes_0, beta = encoder_layers_12_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_12_norm_out_weight_to_fp16, x = input_699_cast_fp16)[name = tensor("input_701_cast_fp16")]; tensor cache_53_begin_0 = const()[name = tensor("cache_53_begin_0"), val = tensor([13, 0, 0, 0])]; tensor cache_53_end_0 = const()[name = tensor("cache_53_end_0"), val = tensor([14, 1, 42, 1024])]; tensor cache_53_end_mask_0 = const()[name = tensor("cache_53_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_53_squeeze_mask_0 = const()[name = tensor("cache_53_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_53_cast_fp16 = slice_by_index(begin = cache_53_begin_0, end = cache_53_end_0, end_mask = cache_53_end_mask_0, squeeze_mask = cache_53_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_53_cast_fp16")]; tensor cache_55_begin_0 = const()[name = tensor("cache_55_begin_0"), val = tensor([13, 0, 0, 0])]; tensor cache_55_end_0 = const()[name = tensor("cache_55_end_0"), val = tensor([14, 1, 1024, 8])]; tensor cache_55_end_mask_0 = const()[name = tensor("cache_55_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_55_squeeze_mask_0 = const()[name = tensor("cache_55_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_55_cast_fp16 = slice_by_index(begin = cache_55_begin_0, end = cache_55_end_0, end_mask = cache_55_end_mask_0, squeeze_mask = cache_55_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_55_cast_fp16")]; tensor input_703_axes_0 = const()[name = tensor("input_703_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_13_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265740352)))]; tensor encoder_layers_13_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_13_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265742464)))]; tensor input_703_cast_fp16 = layer_norm(axes = input_703_axes_0, beta = encoder_layers_13_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_13_norm_feed_forward1_weight_to_fp16, x = input_701_cast_fp16)[name = tensor("input_703_cast_fp16")]; tensor encoder_layers_13_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265744576))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268890368))), name = tensor("encoder_layers_13_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_13_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_13_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268890560)))]; tensor linear_118_cast_fp16 = linear(bias = encoder_layers_13_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_13_feed_forward1_linear1_weight_to_fp16_palettized, x = input_703_cast_fp16)[name = tensor("linear_118_cast_fp16")]; tensor input_707_cast_fp16 = silu(x = linear_118_cast_fp16)[name = tensor("input_707_cast_fp16")]; tensor encoder_layers_13_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268898816))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272044608))), name = tensor("encoder_layers_13_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_13_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_13_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272044800)))]; tensor linear_119_cast_fp16 = linear(bias = encoder_layers_13_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_13_feed_forward1_linear2_weight_to_fp16_palettized, x = input_707_cast_fp16)[name = tensor("linear_119_cast_fp16")]; tensor var_3224_to_fp16 = const()[name = tensor("op_3224_to_fp16"), val = tensor(0x1p-1)]; tensor var_3225_cast_fp16 = mul(x = linear_119_cast_fp16, y = var_3224_to_fp16)[name = tensor("op_3225_cast_fp16")]; tensor input_713_cast_fp16 = add(x = input_701_cast_fp16, y = var_3225_cast_fp16)[name = tensor("input_713_cast_fp16")]; tensor key_27_axes_0 = const()[name = tensor("key_27_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_13_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272046912)))]; tensor encoder_layers_13_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_13_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272049024)))]; tensor key_27_cast_fp16 = layer_norm(axes = key_27_axes_0, beta = encoder_layers_13_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_13_norm_self_att_weight_to_fp16, x = input_713_cast_fp16)[name = tensor("key_27_cast_fp16")]; tensor input_715_interleave_0 = const()[name = tensor("input_715_interleave_0"), val = tensor(false)]; tensor input_715_cast_fp16 = concat(axis = var_68, interleave = input_715_interleave_0, values = (cache_53_cast_fp16, key_27_cast_fp16))[name = tensor("input_715_cast_fp16")]; tensor var_3247_begin_0 = const()[name = tensor("op_3247_begin_0"), val = tensor([0, 7, 0])]; tensor var_3247_end_0 = const()[name = tensor("op_3247_end_0"), val = tensor([1, 42, 1024])]; tensor var_3247_end_mask_0 = const()[name = tensor("op_3247_end_mask_0"), val = tensor([true, true, true])]; tensor var_3247_cast_fp16 = slice_by_index(begin = var_3247_begin_0, end = var_3247_end_0, end_mask = var_3247_end_mask_0, x = cache_53_cast_fp16)[name = tensor("op_3247_cast_fp16")]; tensor var_3253_interleave_0 = const()[name = tensor("op_3253_interleave_0"), val = tensor(false)]; tensor var_3253_cast_fp16 = concat(axis = var_68, interleave = var_3253_interleave_0, values = (var_3247_cast_fp16, key_27_cast_fp16))[name = tensor("op_3253_cast_fp16")]; tensor encoder_layers_13_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272051136))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272837632))), name = tensor("encoder_layers_13_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_13_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272837824)))]; tensor linear_120_cast_fp16 = linear(bias = encoder_layers_13_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_13_self_attn_linear_q_weight_to_fp16_palettized, x = key_27_cast_fp16)[name = tensor("linear_120_cast_fp16")]; tensor var_3258 = const()[name = tensor("op_3258"), val = tensor([1, -1, 8, 128])]; tensor q_79_cast_fp16 = reshape(shape = var_3258, x = linear_120_cast_fp16)[name = tensor("q_79_cast_fp16")]; tensor encoder_layers_13_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272839936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(273626432))), name = tensor("encoder_layers_13_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_13_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(273626624)))]; tensor linear_121_cast_fp16 = linear(bias = encoder_layers_13_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_13_self_attn_linear_k_weight_to_fp16_palettized, x = input_715_cast_fp16)[name = tensor("linear_121_cast_fp16")]; tensor var_3263 = const()[name = tensor("op_3263"), val = tensor([1, -1, 8, 128])]; tensor k_53_cast_fp16 = reshape(shape = var_3263, x = linear_121_cast_fp16)[name = tensor("k_53_cast_fp16")]; tensor encoder_layers_13_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(273628736))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274415232))), name = tensor("encoder_layers_13_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_13_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274415424)))]; tensor linear_122_cast_fp16 = linear(bias = encoder_layers_13_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_13_self_attn_linear_v_weight_to_fp16_palettized, x = input_715_cast_fp16)[name = tensor("linear_122_cast_fp16")]; tensor var_3268 = const()[name = tensor("op_3268"), val = tensor([1, -1, 8, 128])]; tensor v_27_cast_fp16 = reshape(shape = var_3268, x = linear_122_cast_fp16)[name = tensor("v_27_cast_fp16")]; tensor value_35_perm_0 = const()[name = tensor("value_35_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_13_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274417536)))]; tensor var_3281_cast_fp16 = add(x = q_79_cast_fp16, y = encoder_layers_13_self_attn_pos_bias_u_to_fp16)[name = tensor("op_3281_cast_fp16")]; tensor encoder_layers_13_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274419648)))]; tensor var_3283_cast_fp16 = add(x = q_79_cast_fp16, y = encoder_layers_13_self_attn_pos_bias_v_to_fp16)[name = tensor("op_3283_cast_fp16")]; tensor q_with_bias_v_27_perm_0 = const()[name = tensor("q_with_bias_v_27_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_345_transpose_x_0 = const()[name = tensor("x_345_transpose_x_0"), val = tensor(false)]; tensor x_345_transpose_y_0 = const()[name = tensor("x_345_transpose_y_0"), val = tensor(false)]; tensor op_3285_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_3285_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274421760))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274521344))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274521152)))]; tensor q_with_bias_v_27_cast_fp16 = transpose(perm = q_with_bias_v_27_perm_0, x = var_3283_cast_fp16)[name = tensor("transpose_245")]; tensor x_345_cast_fp16 = matmul(transpose_x = x_345_transpose_x_0, transpose_y = x_345_transpose_y_0, x = q_with_bias_v_27_cast_fp16, y = op_3285_to_fp16_quantized)[name = tensor("x_345_cast_fp16")]; tensor x_347_pad_0 = const()[name = tensor("x_347_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_347_mode_0 = const()[name = tensor("x_347_mode_0"), val = tensor("constant")]; tensor const_248_to_fp16 = const()[name = tensor("const_248_to_fp16"), val = tensor(0x0p+0)]; tensor x_347_cast_fp16 = pad(constant_val = const_248_to_fp16, mode = x_347_mode_0, pad = x_347_pad_0, x = x_345_cast_fp16)[name = tensor("x_347_cast_fp16")]; tensor var_3293 = const()[name = tensor("op_3293"), val = tensor([1, 8, -1, 7])]; tensor x_349_cast_fp16 = reshape(shape = var_3293, x = x_347_cast_fp16)[name = tensor("x_349_cast_fp16")]; tensor var_3297_begin_0 = const()[name = tensor("op_3297_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_3297_end_0 = const()[name = tensor("op_3297_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_3297_end_mask_0 = const()[name = tensor("op_3297_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_3297_cast_fp16 = slice_by_index(begin = var_3297_begin_0, end = var_3297_end_0, end_mask = var_3297_end_mask_0, x = x_349_cast_fp16)[name = tensor("op_3297_cast_fp16")]; tensor var_3298 = const()[name = tensor("op_3298"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_53_cast_fp16 = reshape(shape = var_3298, x = var_3297_cast_fp16)[name = tensor("matrix_bd_53_cast_fp16")]; tensor matrix_ac_27_transpose_x_0 = const()[name = tensor("matrix_ac_27_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_27_transpose_y_0 = const()[name = tensor("matrix_ac_27_transpose_y_0"), val = tensor(false)]; tensor transpose_122_perm_0 = const()[name = tensor("transpose_122_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_123_perm_0 = const()[name = tensor("transpose_123_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_123 = transpose(perm = transpose_123_perm_0, x = k_53_cast_fp16)[name = tensor("transpose_243")]; tensor transpose_122 = transpose(perm = transpose_122_perm_0, x = var_3281_cast_fp16)[name = tensor("transpose_244")]; tensor matrix_ac_27_cast_fp16 = matmul(transpose_x = matrix_ac_27_transpose_x_0, transpose_y = matrix_ac_27_transpose_y_0, x = transpose_122, y = transpose_123)[name = tensor("matrix_ac_27_cast_fp16")]; tensor matrix_bd_55_begin_0 = const()[name = tensor("matrix_bd_55_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_55_end_0 = const()[name = tensor("matrix_bd_55_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_55_end_mask_0 = const()[name = tensor("matrix_bd_55_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_55_cast_fp16 = slice_by_index(begin = matrix_bd_55_begin_0, end = matrix_bd_55_end_0, end_mask = matrix_bd_55_end_mask_0, x = matrix_bd_53_cast_fp16)[name = tensor("matrix_bd_55_cast_fp16")]; tensor var_3307_cast_fp16 = add(x = matrix_ac_27_cast_fp16, y = matrix_bd_55_cast_fp16)[name = tensor("op_3307_cast_fp16")]; tensor _inversed_scores_53_y_0_to_fp16 = const()[name = tensor("_inversed_scores_53_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_53_cast_fp16 = mul(x = var_3307_cast_fp16, y = _inversed_scores_53_y_0_to_fp16)[name = tensor("_inversed_scores_53_cast_fp16")]; tensor scores_55_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_53_cast_fp16, cond = mask_11)[name = tensor("scores_55_cast_fp16")]; tensor var_3313_cast_fp16 = softmax(axis = var_59, x = scores_55_cast_fp16)[name = tensor("op_3313_cast_fp16")]; tensor input_717_cast_fp16 = select(a = var_44_to_fp16, b = var_3313_cast_fp16, cond = mask_11)[name = tensor("input_717_cast_fp16")]; tensor x_351_transpose_x_0 = const()[name = tensor("x_351_transpose_x_0"), val = tensor(false)]; tensor x_351_transpose_y_0 = const()[name = tensor("x_351_transpose_y_0"), val = tensor(false)]; tensor value_35_cast_fp16 = transpose(perm = value_35_perm_0, x = v_27_cast_fp16)[name = tensor("transpose_242")]; tensor x_351_cast_fp16 = matmul(transpose_x = x_351_transpose_x_0, transpose_y = x_351_transpose_y_0, x = input_717_cast_fp16, y = value_35_cast_fp16)[name = tensor("x_351_cast_fp16")]; tensor var_3317_perm_0 = const()[name = tensor("op_3317_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3318 = const()[name = tensor("op_3318"), val = tensor([1, -1, 1024])]; tensor var_3317_cast_fp16 = transpose(perm = var_3317_perm_0, x = x_351_cast_fp16)[name = tensor("transpose_241")]; tensor input_719_cast_fp16 = reshape(shape = var_3318, x = var_3317_cast_fp16)[name = tensor("input_719_cast_fp16")]; tensor encoder_layers_13_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274521664))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275308160))), name = tensor("encoder_layers_13_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_13_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275308352)))]; tensor linear_124_cast_fp16 = linear(bias = encoder_layers_13_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_13_self_attn_linear_out_weight_to_fp16_palettized, x = input_719_cast_fp16)[name = tensor("linear_124_cast_fp16")]; tensor input_723_cast_fp16 = add(x = input_713_cast_fp16, y = linear_124_cast_fp16)[name = tensor("input_723_cast_fp16")]; tensor x_355_axes_0 = const()[name = tensor("x_355_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_13_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275310464)))]; tensor encoder_layers_13_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_13_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275312576)))]; tensor x_355_cast_fp16 = layer_norm(axes = x_355_axes_0, beta = encoder_layers_13_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_13_norm_conv_weight_to_fp16, x = input_723_cast_fp16)[name = tensor("x_355_cast_fp16")]; tensor input_725_perm_0 = const()[name = tensor("input_725_perm_0"), val = tensor([0, 2, 1])]; tensor input_727_pad_type_0 = const()[name = tensor("input_727_pad_type_0"), val = tensor("valid")]; tensor input_727_strides_0 = const()[name = tensor("input_727_strides_0"), val = tensor([1])]; tensor input_727_pad_0 = const()[name = tensor("input_727_pad_0"), val = tensor([0, 0])]; tensor input_727_dilations_0 = const()[name = tensor("input_727_dilations_0"), val = tensor([1])]; tensor input_727_groups_0 = const()[name = tensor("input_727_groups_0"), val = tensor(1)]; tensor encoder_layers_13_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_13_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275314688))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277411904))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_725_cast_fp16 = transpose(perm = input_725_perm_0, x = x_355_cast_fp16)[name = tensor("transpose_240")]; tensor input_727_cast_fp16 = conv(dilations = input_727_dilations_0, groups = input_727_groups_0, pad = input_727_pad_0, pad_type = input_727_pad_type_0, strides = input_727_strides_0, weight = encoder_layers_13_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_725_cast_fp16)[name = tensor("input_727_cast_fp16")]; tensor x_357_split_num_splits_0 = const()[name = tensor("x_357_split_num_splits_0"), val = tensor(2)]; tensor x_357_split_axis_0 = const()[name = tensor("x_357_split_axis_0"), val = tensor(1)]; tensor x_357_split_cast_fp16_0, tensor x_357_split_cast_fp16_1 = split(axis = x_357_split_axis_0, num_splits = x_357_split_num_splits_0, x = input_727_cast_fp16)[name = tensor("x_357_split_cast_fp16")]; tensor x_357_split_1_sigmoid_cast_fp16 = sigmoid(x = x_357_split_cast_fp16_1)[name = tensor("x_357_split_1_sigmoid_cast_fp16")]; tensor x_357_cast_fp16 = mul(x = x_357_split_cast_fp16_0, y = x_357_split_1_sigmoid_cast_fp16)[name = tensor("x_357_cast_fp16")]; tensor input_729_cast_fp16 = select(a = var_44_to_fp16, b = x_357_cast_fp16, cond = var_575)[name = tensor("input_729_cast_fp16")]; tensor new_x_55_interleave_0 = const()[name = tensor("new_x_55_interleave_0"), val = tensor(false)]; tensor new_x_55_cast_fp16 = concat(axis = var_59, interleave = new_x_55_interleave_0, values = (cache_55_cast_fp16, input_729_cast_fp16))[name = tensor("new_x_55_cast_fp16")]; tensor var_3357_begin_0 = const()[name = tensor("op_3357_begin_0"), val = tensor([0, 0, 7])]; tensor var_3357_end_0 = const()[name = tensor("op_3357_end_0"), val = tensor([1, 1024, 15])]; tensor var_3357_end_mask_0 = const()[name = tensor("op_3357_end_mask_0"), val = tensor([true, true, true])]; tensor var_3357_cast_fp16 = slice_by_index(begin = var_3357_begin_0, end = var_3357_end_0, end_mask = var_3357_end_mask_0, x = new_x_55_cast_fp16)[name = tensor("op_3357_cast_fp16")]; tensor x_359_pad_type_0 = const()[name = tensor("x_359_pad_type_0"), val = tensor("valid")]; tensor x_359_groups_0 = const()[name = tensor("x_359_groups_0"), val = tensor(1024)]; tensor x_359_strides_0 = const()[name = tensor("x_359_strides_0"), val = tensor([1])]; tensor x_359_pad_0 = const()[name = tensor("x_359_pad_0"), val = tensor([0, 0])]; tensor x_359_dilations_0 = const()[name = tensor("x_359_dilations_0"), val = tensor([1])]; tensor encoder_layers_13_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_13_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277416064))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277425344))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_359_cast_fp16 = conv(dilations = x_359_dilations_0, groups = x_359_groups_0, pad = x_359_pad_0, pad_type = x_359_pad_type_0, strides = x_359_strides_0, weight = encoder_layers_13_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_55_cast_fp16)[name = tensor("x_359_cast_fp16")]; tensor input_731_perm_0 = const()[name = tensor("input_731_perm_0"), val = tensor([0, 2, 1])]; tensor x_361_axes_0 = const()[name = tensor("x_361_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_13_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277427456)))]; tensor encoder_layers_13_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_13_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277429568)))]; tensor input_731_cast_fp16 = transpose(perm = input_731_perm_0, x = x_359_cast_fp16)[name = tensor("transpose_239")]; tensor x_361_cast_fp16 = layer_norm(axes = x_361_axes_0, beta = encoder_layers_13_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_13_conv_batch_norm_weight_to_fp16, x = input_731_cast_fp16)[name = tensor("x_361_cast_fp16")]; tensor input_733_perm_0 = const()[name = tensor("input_733_perm_0"), val = tensor([0, 2, 1])]; tensor input_733_cast_fp16 = transpose(perm = input_733_perm_0, x = x_361_cast_fp16)[name = tensor("transpose_238")]; tensor input_735_cast_fp16 = silu(x = input_733_cast_fp16)[name = tensor("input_735_cast_fp16")]; tensor x_363_pad_type_0 = const()[name = tensor("x_363_pad_type_0"), val = tensor("valid")]; tensor x_363_strides_0 = const()[name = tensor("x_363_strides_0"), val = tensor([1])]; tensor x_363_pad_0 = const()[name = tensor("x_363_pad_0"), val = tensor([0, 0])]; tensor x_363_dilations_0 = const()[name = tensor("x_363_dilations_0"), val = tensor([1])]; tensor x_363_groups_0 = const()[name = tensor("x_363_groups_0"), val = tensor(1)]; tensor encoder_layers_13_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_13_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277431680))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278480320))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_363_cast_fp16 = conv(dilations = x_363_dilations_0, groups = x_363_groups_0, pad = x_363_pad_0, pad_type = x_363_pad_type_0, strides = x_363_strides_0, weight = encoder_layers_13_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_735_cast_fp16)[name = tensor("x_363_cast_fp16")]; tensor input_737_perm_0 = const()[name = tensor("input_737_perm_0"), val = tensor([0, 2, 1])]; tensor input_737_cast_fp16 = transpose(perm = input_737_perm_0, x = x_363_cast_fp16)[name = tensor("transpose_237")]; tensor input_739_cast_fp16 = add(x = input_723_cast_fp16, y = input_737_cast_fp16)[name = tensor("input_739_cast_fp16")]; tensor input_741_axes_0 = const()[name = tensor("input_741_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_13_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278482432)))]; tensor encoder_layers_13_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_13_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278484544)))]; tensor input_741_cast_fp16 = layer_norm(axes = input_741_axes_0, beta = encoder_layers_13_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_13_norm_feed_forward2_weight_to_fp16, x = input_739_cast_fp16)[name = tensor("input_741_cast_fp16")]; tensor encoder_layers_13_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278486656))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(281632448))), name = tensor("encoder_layers_13_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_13_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_13_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(281632640)))]; tensor linear_125_cast_fp16 = linear(bias = encoder_layers_13_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_13_feed_forward2_linear1_weight_to_fp16_palettized, x = input_741_cast_fp16)[name = tensor("linear_125_cast_fp16")]; tensor input_745_cast_fp16 = silu(x = linear_125_cast_fp16)[name = tensor("input_745_cast_fp16")]; tensor encoder_layers_13_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(281640896))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(284786688))), name = tensor("encoder_layers_13_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_13_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_13_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(284786880)))]; tensor linear_126_cast_fp16 = linear(bias = encoder_layers_13_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_13_feed_forward2_linear2_weight_to_fp16_palettized, x = input_745_cast_fp16)[name = tensor("linear_126_cast_fp16")]; tensor var_3400_to_fp16 = const()[name = tensor("op_3400_to_fp16"), val = tensor(0x1p-1)]; tensor var_3401_cast_fp16 = mul(x = linear_126_cast_fp16, y = var_3400_to_fp16)[name = tensor("op_3401_cast_fp16")]; tensor input_751_cast_fp16 = add(x = input_739_cast_fp16, y = var_3401_cast_fp16)[name = tensor("input_751_cast_fp16")]; tensor input_753_axes_0 = const()[name = tensor("input_753_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_13_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(284788992)))]; tensor encoder_layers_13_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_13_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(284791104)))]; tensor input_753_cast_fp16 = layer_norm(axes = input_753_axes_0, beta = encoder_layers_13_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_13_norm_out_weight_to_fp16, x = input_751_cast_fp16)[name = tensor("input_753_cast_fp16")]; tensor cache_57_begin_0 = const()[name = tensor("cache_57_begin_0"), val = tensor([14, 0, 0, 0])]; tensor cache_57_end_0 = const()[name = tensor("cache_57_end_0"), val = tensor([15, 1, 42, 1024])]; tensor cache_57_end_mask_0 = const()[name = tensor("cache_57_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_57_squeeze_mask_0 = const()[name = tensor("cache_57_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_57_cast_fp16 = slice_by_index(begin = cache_57_begin_0, end = cache_57_end_0, end_mask = cache_57_end_mask_0, squeeze_mask = cache_57_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_57_cast_fp16")]; tensor cache_59_begin_0 = const()[name = tensor("cache_59_begin_0"), val = tensor([14, 0, 0, 0])]; tensor cache_59_end_0 = const()[name = tensor("cache_59_end_0"), val = tensor([15, 1, 1024, 8])]; tensor cache_59_end_mask_0 = const()[name = tensor("cache_59_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_59_squeeze_mask_0 = const()[name = tensor("cache_59_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_59_cast_fp16 = slice_by_index(begin = cache_59_begin_0, end = cache_59_end_0, end_mask = cache_59_end_mask_0, squeeze_mask = cache_59_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_59_cast_fp16")]; tensor input_755_axes_0 = const()[name = tensor("input_755_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_14_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(284793216)))]; tensor encoder_layers_14_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_14_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(284795328)))]; tensor input_755_cast_fp16 = layer_norm(axes = input_755_axes_0, beta = encoder_layers_14_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_14_norm_feed_forward1_weight_to_fp16, x = input_753_cast_fp16)[name = tensor("input_755_cast_fp16")]; tensor encoder_layers_14_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(284797440))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(287943232))), name = tensor("encoder_layers_14_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_14_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_14_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(287943424)))]; tensor linear_127_cast_fp16 = linear(bias = encoder_layers_14_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_14_feed_forward1_linear1_weight_to_fp16_palettized, x = input_755_cast_fp16)[name = tensor("linear_127_cast_fp16")]; tensor input_759_cast_fp16 = silu(x = linear_127_cast_fp16)[name = tensor("input_759_cast_fp16")]; tensor encoder_layers_14_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(287951680))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291097472))), name = tensor("encoder_layers_14_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_14_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_14_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291097664)))]; tensor linear_128_cast_fp16 = linear(bias = encoder_layers_14_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_14_feed_forward1_linear2_weight_to_fp16_palettized, x = input_759_cast_fp16)[name = tensor("linear_128_cast_fp16")]; tensor var_3437_to_fp16 = const()[name = tensor("op_3437_to_fp16"), val = tensor(0x1p-1)]; tensor var_3438_cast_fp16 = mul(x = linear_128_cast_fp16, y = var_3437_to_fp16)[name = tensor("op_3438_cast_fp16")]; tensor input_765_cast_fp16 = add(x = input_753_cast_fp16, y = var_3438_cast_fp16)[name = tensor("input_765_cast_fp16")]; tensor key_29_axes_0 = const()[name = tensor("key_29_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_14_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291099776)))]; tensor encoder_layers_14_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_14_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291101888)))]; tensor key_29_cast_fp16 = layer_norm(axes = key_29_axes_0, beta = encoder_layers_14_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_14_norm_self_att_weight_to_fp16, x = input_765_cast_fp16)[name = tensor("key_29_cast_fp16")]; tensor input_767_interleave_0 = const()[name = tensor("input_767_interleave_0"), val = tensor(false)]; tensor input_767_cast_fp16 = concat(axis = var_68, interleave = input_767_interleave_0, values = (cache_57_cast_fp16, key_29_cast_fp16))[name = tensor("input_767_cast_fp16")]; tensor var_3460_begin_0 = const()[name = tensor("op_3460_begin_0"), val = tensor([0, 7, 0])]; tensor var_3460_end_0 = const()[name = tensor("op_3460_end_0"), val = tensor([1, 42, 1024])]; tensor var_3460_end_mask_0 = const()[name = tensor("op_3460_end_mask_0"), val = tensor([true, true, true])]; tensor var_3460_cast_fp16 = slice_by_index(begin = var_3460_begin_0, end = var_3460_end_0, end_mask = var_3460_end_mask_0, x = cache_57_cast_fp16)[name = tensor("op_3460_cast_fp16")]; tensor var_3466_interleave_0 = const()[name = tensor("op_3466_interleave_0"), val = tensor(false)]; tensor var_3466_cast_fp16 = concat(axis = var_68, interleave = var_3466_interleave_0, values = (var_3460_cast_fp16, key_29_cast_fp16))[name = tensor("op_3466_cast_fp16")]; tensor encoder_layers_14_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291104000))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291890496))), name = tensor("encoder_layers_14_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_14_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291890688)))]; tensor linear_129_cast_fp16 = linear(bias = encoder_layers_14_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_14_self_attn_linear_q_weight_to_fp16_palettized, x = key_29_cast_fp16)[name = tensor("linear_129_cast_fp16")]; tensor var_3471 = const()[name = tensor("op_3471"), val = tensor([1, -1, 8, 128])]; tensor q_85_cast_fp16 = reshape(shape = var_3471, x = linear_129_cast_fp16)[name = tensor("q_85_cast_fp16")]; tensor encoder_layers_14_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291892800))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292679296))), name = tensor("encoder_layers_14_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_14_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292679488)))]; tensor linear_130_cast_fp16 = linear(bias = encoder_layers_14_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_14_self_attn_linear_k_weight_to_fp16_palettized, x = input_767_cast_fp16)[name = tensor("linear_130_cast_fp16")]; tensor var_3476 = const()[name = tensor("op_3476"), val = tensor([1, -1, 8, 128])]; tensor k_57_cast_fp16 = reshape(shape = var_3476, x = linear_130_cast_fp16)[name = tensor("k_57_cast_fp16")]; tensor encoder_layers_14_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292681600))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293468096))), name = tensor("encoder_layers_14_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_14_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293468288)))]; tensor linear_131_cast_fp16 = linear(bias = encoder_layers_14_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_14_self_attn_linear_v_weight_to_fp16_palettized, x = input_767_cast_fp16)[name = tensor("linear_131_cast_fp16")]; tensor var_3481 = const()[name = tensor("op_3481"), val = tensor([1, -1, 8, 128])]; tensor v_29_cast_fp16 = reshape(shape = var_3481, x = linear_131_cast_fp16)[name = tensor("v_29_cast_fp16")]; tensor value_37_perm_0 = const()[name = tensor("value_37_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_14_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293470400)))]; tensor var_3494_cast_fp16 = add(x = q_85_cast_fp16, y = encoder_layers_14_self_attn_pos_bias_u_to_fp16)[name = tensor("op_3494_cast_fp16")]; tensor encoder_layers_14_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293472512)))]; tensor var_3496_cast_fp16 = add(x = q_85_cast_fp16, y = encoder_layers_14_self_attn_pos_bias_v_to_fp16)[name = tensor("op_3496_cast_fp16")]; tensor q_with_bias_v_29_perm_0 = const()[name = tensor("q_with_bias_v_29_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_371_transpose_x_0 = const()[name = tensor("x_371_transpose_x_0"), val = tensor(false)]; tensor x_371_transpose_y_0 = const()[name = tensor("x_371_transpose_y_0"), val = tensor(false)]; tensor op_3498_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_3498_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293474624))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293574208))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293574016)))]; tensor q_with_bias_v_29_cast_fp16 = transpose(perm = q_with_bias_v_29_perm_0, x = var_3496_cast_fp16)[name = tensor("transpose_236")]; tensor x_371_cast_fp16 = matmul(transpose_x = x_371_transpose_x_0, transpose_y = x_371_transpose_y_0, x = q_with_bias_v_29_cast_fp16, y = op_3498_to_fp16_quantized)[name = tensor("x_371_cast_fp16")]; tensor x_373_pad_0 = const()[name = tensor("x_373_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_373_mode_0 = const()[name = tensor("x_373_mode_0"), val = tensor("constant")]; tensor const_261_to_fp16 = const()[name = tensor("const_261_to_fp16"), val = tensor(0x0p+0)]; tensor x_373_cast_fp16 = pad(constant_val = const_261_to_fp16, mode = x_373_mode_0, pad = x_373_pad_0, x = x_371_cast_fp16)[name = tensor("x_373_cast_fp16")]; tensor var_3506 = const()[name = tensor("op_3506"), val = tensor([1, 8, -1, 7])]; tensor x_375_cast_fp16 = reshape(shape = var_3506, x = x_373_cast_fp16)[name = tensor("x_375_cast_fp16")]; tensor var_3510_begin_0 = const()[name = tensor("op_3510_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_3510_end_0 = const()[name = tensor("op_3510_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_3510_end_mask_0 = const()[name = tensor("op_3510_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_3510_cast_fp16 = slice_by_index(begin = var_3510_begin_0, end = var_3510_end_0, end_mask = var_3510_end_mask_0, x = x_375_cast_fp16)[name = tensor("op_3510_cast_fp16")]; tensor var_3511 = const()[name = tensor("op_3511"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_57_cast_fp16 = reshape(shape = var_3511, x = var_3510_cast_fp16)[name = tensor("matrix_bd_57_cast_fp16")]; tensor matrix_ac_29_transpose_x_0 = const()[name = tensor("matrix_ac_29_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_29_transpose_y_0 = const()[name = tensor("matrix_ac_29_transpose_y_0"), val = tensor(false)]; tensor transpose_124_perm_0 = const()[name = tensor("transpose_124_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_125_perm_0 = const()[name = tensor("transpose_125_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_125 = transpose(perm = transpose_125_perm_0, x = k_57_cast_fp16)[name = tensor("transpose_234")]; tensor transpose_124 = transpose(perm = transpose_124_perm_0, x = var_3494_cast_fp16)[name = tensor("transpose_235")]; tensor matrix_ac_29_cast_fp16 = matmul(transpose_x = matrix_ac_29_transpose_x_0, transpose_y = matrix_ac_29_transpose_y_0, x = transpose_124, y = transpose_125)[name = tensor("matrix_ac_29_cast_fp16")]; tensor matrix_bd_59_begin_0 = const()[name = tensor("matrix_bd_59_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_59_end_0 = const()[name = tensor("matrix_bd_59_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_59_end_mask_0 = const()[name = tensor("matrix_bd_59_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_59_cast_fp16 = slice_by_index(begin = matrix_bd_59_begin_0, end = matrix_bd_59_end_0, end_mask = matrix_bd_59_end_mask_0, x = matrix_bd_57_cast_fp16)[name = tensor("matrix_bd_59_cast_fp16")]; tensor var_3520_cast_fp16 = add(x = matrix_ac_29_cast_fp16, y = matrix_bd_59_cast_fp16)[name = tensor("op_3520_cast_fp16")]; tensor _inversed_scores_57_y_0_to_fp16 = const()[name = tensor("_inversed_scores_57_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_57_cast_fp16 = mul(x = var_3520_cast_fp16, y = _inversed_scores_57_y_0_to_fp16)[name = tensor("_inversed_scores_57_cast_fp16")]; tensor scores_59_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_57_cast_fp16, cond = mask_11)[name = tensor("scores_59_cast_fp16")]; tensor var_3526_cast_fp16 = softmax(axis = var_59, x = scores_59_cast_fp16)[name = tensor("op_3526_cast_fp16")]; tensor input_769_cast_fp16 = select(a = var_44_to_fp16, b = var_3526_cast_fp16, cond = mask_11)[name = tensor("input_769_cast_fp16")]; tensor x_377_transpose_x_0 = const()[name = tensor("x_377_transpose_x_0"), val = tensor(false)]; tensor x_377_transpose_y_0 = const()[name = tensor("x_377_transpose_y_0"), val = tensor(false)]; tensor value_37_cast_fp16 = transpose(perm = value_37_perm_0, x = v_29_cast_fp16)[name = tensor("transpose_233")]; tensor x_377_cast_fp16 = matmul(transpose_x = x_377_transpose_x_0, transpose_y = x_377_transpose_y_0, x = input_769_cast_fp16, y = value_37_cast_fp16)[name = tensor("x_377_cast_fp16")]; tensor var_3530_perm_0 = const()[name = tensor("op_3530_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3531 = const()[name = tensor("op_3531"), val = tensor([1, -1, 1024])]; tensor var_3530_cast_fp16 = transpose(perm = var_3530_perm_0, x = x_377_cast_fp16)[name = tensor("transpose_232")]; tensor input_771_cast_fp16 = reshape(shape = var_3531, x = var_3530_cast_fp16)[name = tensor("input_771_cast_fp16")]; tensor encoder_layers_14_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293574528))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294361024))), name = tensor("encoder_layers_14_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_14_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294361216)))]; tensor linear_133_cast_fp16 = linear(bias = encoder_layers_14_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_14_self_attn_linear_out_weight_to_fp16_palettized, x = input_771_cast_fp16)[name = tensor("linear_133_cast_fp16")]; tensor input_775_cast_fp16 = add(x = input_765_cast_fp16, y = linear_133_cast_fp16)[name = tensor("input_775_cast_fp16")]; tensor x_381_axes_0 = const()[name = tensor("x_381_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_14_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294363328)))]; tensor encoder_layers_14_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_14_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294365440)))]; tensor x_381_cast_fp16 = layer_norm(axes = x_381_axes_0, beta = encoder_layers_14_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_14_norm_conv_weight_to_fp16, x = input_775_cast_fp16)[name = tensor("x_381_cast_fp16")]; tensor input_777_perm_0 = const()[name = tensor("input_777_perm_0"), val = tensor([0, 2, 1])]; tensor input_779_pad_type_0 = const()[name = tensor("input_779_pad_type_0"), val = tensor("valid")]; tensor input_779_strides_0 = const()[name = tensor("input_779_strides_0"), val = tensor([1])]; tensor input_779_pad_0 = const()[name = tensor("input_779_pad_0"), val = tensor([0, 0])]; tensor input_779_dilations_0 = const()[name = tensor("input_779_dilations_0"), val = tensor([1])]; tensor input_779_groups_0 = const()[name = tensor("input_779_groups_0"), val = tensor(1)]; tensor encoder_layers_14_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_14_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294367552))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(296464768))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_777_cast_fp16 = transpose(perm = input_777_perm_0, x = x_381_cast_fp16)[name = tensor("transpose_231")]; tensor input_779_cast_fp16 = conv(dilations = input_779_dilations_0, groups = input_779_groups_0, pad = input_779_pad_0, pad_type = input_779_pad_type_0, strides = input_779_strides_0, weight = encoder_layers_14_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_777_cast_fp16)[name = tensor("input_779_cast_fp16")]; tensor x_383_split_num_splits_0 = const()[name = tensor("x_383_split_num_splits_0"), val = tensor(2)]; tensor x_383_split_axis_0 = const()[name = tensor("x_383_split_axis_0"), val = tensor(1)]; tensor x_383_split_cast_fp16_0, tensor x_383_split_cast_fp16_1 = split(axis = x_383_split_axis_0, num_splits = x_383_split_num_splits_0, x = input_779_cast_fp16)[name = tensor("x_383_split_cast_fp16")]; tensor x_383_split_1_sigmoid_cast_fp16 = sigmoid(x = x_383_split_cast_fp16_1)[name = tensor("x_383_split_1_sigmoid_cast_fp16")]; tensor x_383_cast_fp16 = mul(x = x_383_split_cast_fp16_0, y = x_383_split_1_sigmoid_cast_fp16)[name = tensor("x_383_cast_fp16")]; tensor input_781_cast_fp16 = select(a = var_44_to_fp16, b = x_383_cast_fp16, cond = var_575)[name = tensor("input_781_cast_fp16")]; tensor new_x_59_interleave_0 = const()[name = tensor("new_x_59_interleave_0"), val = tensor(false)]; tensor new_x_59_cast_fp16 = concat(axis = var_59, interleave = new_x_59_interleave_0, values = (cache_59_cast_fp16, input_781_cast_fp16))[name = tensor("new_x_59_cast_fp16")]; tensor var_3570_begin_0 = const()[name = tensor("op_3570_begin_0"), val = tensor([0, 0, 7])]; tensor var_3570_end_0 = const()[name = tensor("op_3570_end_0"), val = tensor([1, 1024, 15])]; tensor var_3570_end_mask_0 = const()[name = tensor("op_3570_end_mask_0"), val = tensor([true, true, true])]; tensor var_3570_cast_fp16 = slice_by_index(begin = var_3570_begin_0, end = var_3570_end_0, end_mask = var_3570_end_mask_0, x = new_x_59_cast_fp16)[name = tensor("op_3570_cast_fp16")]; tensor x_385_pad_type_0 = const()[name = tensor("x_385_pad_type_0"), val = tensor("valid")]; tensor x_385_groups_0 = const()[name = tensor("x_385_groups_0"), val = tensor(1024)]; tensor x_385_strides_0 = const()[name = tensor("x_385_strides_0"), val = tensor([1])]; tensor x_385_pad_0 = const()[name = tensor("x_385_pad_0"), val = tensor([0, 0])]; tensor x_385_dilations_0 = const()[name = tensor("x_385_dilations_0"), val = tensor([1])]; tensor encoder_layers_14_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_14_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(296468928))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(296478208))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_385_cast_fp16 = conv(dilations = x_385_dilations_0, groups = x_385_groups_0, pad = x_385_pad_0, pad_type = x_385_pad_type_0, strides = x_385_strides_0, weight = encoder_layers_14_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_59_cast_fp16)[name = tensor("x_385_cast_fp16")]; tensor input_783_perm_0 = const()[name = tensor("input_783_perm_0"), val = tensor([0, 2, 1])]; tensor x_387_axes_0 = const()[name = tensor("x_387_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_14_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(296480320)))]; tensor encoder_layers_14_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_14_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(296482432)))]; tensor input_783_cast_fp16 = transpose(perm = input_783_perm_0, x = x_385_cast_fp16)[name = tensor("transpose_230")]; tensor x_387_cast_fp16 = layer_norm(axes = x_387_axes_0, beta = encoder_layers_14_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_14_conv_batch_norm_weight_to_fp16, x = input_783_cast_fp16)[name = tensor("x_387_cast_fp16")]; tensor input_785_perm_0 = const()[name = tensor("input_785_perm_0"), val = tensor([0, 2, 1])]; tensor input_785_cast_fp16 = transpose(perm = input_785_perm_0, x = x_387_cast_fp16)[name = tensor("transpose_229")]; tensor input_787_cast_fp16 = silu(x = input_785_cast_fp16)[name = tensor("input_787_cast_fp16")]; tensor x_389_pad_type_0 = const()[name = tensor("x_389_pad_type_0"), val = tensor("valid")]; tensor x_389_strides_0 = const()[name = tensor("x_389_strides_0"), val = tensor([1])]; tensor x_389_pad_0 = const()[name = tensor("x_389_pad_0"), val = tensor([0, 0])]; tensor x_389_dilations_0 = const()[name = tensor("x_389_dilations_0"), val = tensor([1])]; tensor x_389_groups_0 = const()[name = tensor("x_389_groups_0"), val = tensor(1)]; tensor encoder_layers_14_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_14_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(296484544))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297533184))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_389_cast_fp16 = conv(dilations = x_389_dilations_0, groups = x_389_groups_0, pad = x_389_pad_0, pad_type = x_389_pad_type_0, strides = x_389_strides_0, weight = encoder_layers_14_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_787_cast_fp16)[name = tensor("x_389_cast_fp16")]; tensor input_789_perm_0 = const()[name = tensor("input_789_perm_0"), val = tensor([0, 2, 1])]; tensor input_789_cast_fp16 = transpose(perm = input_789_perm_0, x = x_389_cast_fp16)[name = tensor("transpose_228")]; tensor input_791_cast_fp16 = add(x = input_775_cast_fp16, y = input_789_cast_fp16)[name = tensor("input_791_cast_fp16")]; tensor input_793_axes_0 = const()[name = tensor("input_793_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_14_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297535296)))]; tensor encoder_layers_14_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_14_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297537408)))]; tensor input_793_cast_fp16 = layer_norm(axes = input_793_axes_0, beta = encoder_layers_14_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_14_norm_feed_forward2_weight_to_fp16, x = input_791_cast_fp16)[name = tensor("input_793_cast_fp16")]; tensor encoder_layers_14_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297539520))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(300685312))), name = tensor("encoder_layers_14_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_14_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_14_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(300685504)))]; tensor linear_134_cast_fp16 = linear(bias = encoder_layers_14_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_14_feed_forward2_linear1_weight_to_fp16_palettized, x = input_793_cast_fp16)[name = tensor("linear_134_cast_fp16")]; tensor input_797_cast_fp16 = silu(x = linear_134_cast_fp16)[name = tensor("input_797_cast_fp16")]; tensor encoder_layers_14_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(300693760))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303839552))), name = tensor("encoder_layers_14_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_14_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_14_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303839744)))]; tensor linear_135_cast_fp16 = linear(bias = encoder_layers_14_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_14_feed_forward2_linear2_weight_to_fp16_palettized, x = input_797_cast_fp16)[name = tensor("linear_135_cast_fp16")]; tensor var_3613_to_fp16 = const()[name = tensor("op_3613_to_fp16"), val = tensor(0x1p-1)]; tensor var_3614_cast_fp16 = mul(x = linear_135_cast_fp16, y = var_3613_to_fp16)[name = tensor("op_3614_cast_fp16")]; tensor input_803_cast_fp16 = add(x = input_791_cast_fp16, y = var_3614_cast_fp16)[name = tensor("input_803_cast_fp16")]; tensor input_805_axes_0 = const()[name = tensor("input_805_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_14_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303841856)))]; tensor encoder_layers_14_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_14_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303843968)))]; tensor input_805_cast_fp16 = layer_norm(axes = input_805_axes_0, beta = encoder_layers_14_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_14_norm_out_weight_to_fp16, x = input_803_cast_fp16)[name = tensor("input_805_cast_fp16")]; tensor cache_61_begin_0 = const()[name = tensor("cache_61_begin_0"), val = tensor([15, 0, 0, 0])]; tensor cache_61_end_0 = const()[name = tensor("cache_61_end_0"), val = tensor([16, 1, 42, 1024])]; tensor cache_61_end_mask_0 = const()[name = tensor("cache_61_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_61_squeeze_mask_0 = const()[name = tensor("cache_61_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_61_cast_fp16 = slice_by_index(begin = cache_61_begin_0, end = cache_61_end_0, end_mask = cache_61_end_mask_0, squeeze_mask = cache_61_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_61_cast_fp16")]; tensor cache_63_begin_0 = const()[name = tensor("cache_63_begin_0"), val = tensor([15, 0, 0, 0])]; tensor cache_63_end_0 = const()[name = tensor("cache_63_end_0"), val = tensor([16, 1, 1024, 8])]; tensor cache_63_end_mask_0 = const()[name = tensor("cache_63_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_63_squeeze_mask_0 = const()[name = tensor("cache_63_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_63_cast_fp16 = slice_by_index(begin = cache_63_begin_0, end = cache_63_end_0, end_mask = cache_63_end_mask_0, squeeze_mask = cache_63_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_63_cast_fp16")]; tensor input_807_axes_0 = const()[name = tensor("input_807_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_15_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303846080)))]; tensor encoder_layers_15_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_15_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303848192)))]; tensor input_807_cast_fp16 = layer_norm(axes = input_807_axes_0, beta = encoder_layers_15_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_15_norm_feed_forward1_weight_to_fp16, x = input_805_cast_fp16)[name = tensor("input_807_cast_fp16")]; tensor encoder_layers_15_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303850304))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(306996096))), name = tensor("encoder_layers_15_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_15_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_15_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(306996288)))]; tensor linear_136_cast_fp16 = linear(bias = encoder_layers_15_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_15_feed_forward1_linear1_weight_to_fp16_palettized, x = input_807_cast_fp16)[name = tensor("linear_136_cast_fp16")]; tensor input_811_cast_fp16 = silu(x = linear_136_cast_fp16)[name = tensor("input_811_cast_fp16")]; tensor encoder_layers_15_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(307004544))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(310150336))), name = tensor("encoder_layers_15_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_15_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_15_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(310150528)))]; tensor linear_137_cast_fp16 = linear(bias = encoder_layers_15_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_15_feed_forward1_linear2_weight_to_fp16_palettized, x = input_811_cast_fp16)[name = tensor("linear_137_cast_fp16")]; tensor var_3650_to_fp16 = const()[name = tensor("op_3650_to_fp16"), val = tensor(0x1p-1)]; tensor var_3651_cast_fp16 = mul(x = linear_137_cast_fp16, y = var_3650_to_fp16)[name = tensor("op_3651_cast_fp16")]; tensor input_817_cast_fp16 = add(x = input_805_cast_fp16, y = var_3651_cast_fp16)[name = tensor("input_817_cast_fp16")]; tensor key_31_axes_0 = const()[name = tensor("key_31_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_15_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(310152640)))]; tensor encoder_layers_15_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_15_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(310154752)))]; tensor key_31_cast_fp16 = layer_norm(axes = key_31_axes_0, beta = encoder_layers_15_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_15_norm_self_att_weight_to_fp16, x = input_817_cast_fp16)[name = tensor("key_31_cast_fp16")]; tensor input_819_interleave_0 = const()[name = tensor("input_819_interleave_0"), val = tensor(false)]; tensor input_819_cast_fp16 = concat(axis = var_68, interleave = input_819_interleave_0, values = (cache_61_cast_fp16, key_31_cast_fp16))[name = tensor("input_819_cast_fp16")]; tensor var_3673_begin_0 = const()[name = tensor("op_3673_begin_0"), val = tensor([0, 7, 0])]; tensor var_3673_end_0 = const()[name = tensor("op_3673_end_0"), val = tensor([1, 42, 1024])]; tensor var_3673_end_mask_0 = const()[name = tensor("op_3673_end_mask_0"), val = tensor([true, true, true])]; tensor var_3673_cast_fp16 = slice_by_index(begin = var_3673_begin_0, end = var_3673_end_0, end_mask = var_3673_end_mask_0, x = cache_61_cast_fp16)[name = tensor("op_3673_cast_fp16")]; tensor var_3679_interleave_0 = const()[name = tensor("op_3679_interleave_0"), val = tensor(false)]; tensor var_3679_cast_fp16 = concat(axis = var_68, interleave = var_3679_interleave_0, values = (var_3673_cast_fp16, key_31_cast_fp16))[name = tensor("op_3679_cast_fp16")]; tensor encoder_layers_15_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(310156864))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(310943360))), name = tensor("encoder_layers_15_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_15_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(310943552)))]; tensor linear_138_cast_fp16 = linear(bias = encoder_layers_15_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_15_self_attn_linear_q_weight_to_fp16_palettized, x = key_31_cast_fp16)[name = tensor("linear_138_cast_fp16")]; tensor var_3684 = const()[name = tensor("op_3684"), val = tensor([1, -1, 8, 128])]; tensor q_91_cast_fp16 = reshape(shape = var_3684, x = linear_138_cast_fp16)[name = tensor("q_91_cast_fp16")]; tensor encoder_layers_15_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(310945664))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311732160))), name = tensor("encoder_layers_15_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_15_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311732352)))]; tensor linear_139_cast_fp16 = linear(bias = encoder_layers_15_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_15_self_attn_linear_k_weight_to_fp16_palettized, x = input_819_cast_fp16)[name = tensor("linear_139_cast_fp16")]; tensor var_3689 = const()[name = tensor("op_3689"), val = tensor([1, -1, 8, 128])]; tensor k_61_cast_fp16 = reshape(shape = var_3689, x = linear_139_cast_fp16)[name = tensor("k_61_cast_fp16")]; tensor encoder_layers_15_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311734464))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312520960))), name = tensor("encoder_layers_15_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_15_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312521152)))]; tensor linear_140_cast_fp16 = linear(bias = encoder_layers_15_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_15_self_attn_linear_v_weight_to_fp16_palettized, x = input_819_cast_fp16)[name = tensor("linear_140_cast_fp16")]; tensor var_3694 = const()[name = tensor("op_3694"), val = tensor([1, -1, 8, 128])]; tensor v_31_cast_fp16 = reshape(shape = var_3694, x = linear_140_cast_fp16)[name = tensor("v_31_cast_fp16")]; tensor value_39_perm_0 = const()[name = tensor("value_39_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_15_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312523264)))]; tensor var_3707_cast_fp16 = add(x = q_91_cast_fp16, y = encoder_layers_15_self_attn_pos_bias_u_to_fp16)[name = tensor("op_3707_cast_fp16")]; tensor encoder_layers_15_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312525376)))]; tensor var_3709_cast_fp16 = add(x = q_91_cast_fp16, y = encoder_layers_15_self_attn_pos_bias_v_to_fp16)[name = tensor("op_3709_cast_fp16")]; tensor q_with_bias_v_31_perm_0 = const()[name = tensor("q_with_bias_v_31_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_397_transpose_x_0 = const()[name = tensor("x_397_transpose_x_0"), val = tensor(false)]; tensor x_397_transpose_y_0 = const()[name = tensor("x_397_transpose_y_0"), val = tensor(false)]; tensor op_3711_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_3711_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312527488))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312627072))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312626880)))]; tensor q_with_bias_v_31_cast_fp16 = transpose(perm = q_with_bias_v_31_perm_0, x = var_3709_cast_fp16)[name = tensor("transpose_227")]; tensor x_397_cast_fp16 = matmul(transpose_x = x_397_transpose_x_0, transpose_y = x_397_transpose_y_0, x = q_with_bias_v_31_cast_fp16, y = op_3711_to_fp16_quantized)[name = tensor("x_397_cast_fp16")]; tensor x_399_pad_0 = const()[name = tensor("x_399_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_399_mode_0 = const()[name = tensor("x_399_mode_0"), val = tensor("constant")]; tensor const_274_to_fp16 = const()[name = tensor("const_274_to_fp16"), val = tensor(0x0p+0)]; tensor x_399_cast_fp16 = pad(constant_val = const_274_to_fp16, mode = x_399_mode_0, pad = x_399_pad_0, x = x_397_cast_fp16)[name = tensor("x_399_cast_fp16")]; tensor var_3719 = const()[name = tensor("op_3719"), val = tensor([1, 8, -1, 7])]; tensor x_401_cast_fp16 = reshape(shape = var_3719, x = x_399_cast_fp16)[name = tensor("x_401_cast_fp16")]; tensor var_3723_begin_0 = const()[name = tensor("op_3723_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_3723_end_0 = const()[name = tensor("op_3723_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_3723_end_mask_0 = const()[name = tensor("op_3723_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_3723_cast_fp16 = slice_by_index(begin = var_3723_begin_0, end = var_3723_end_0, end_mask = var_3723_end_mask_0, x = x_401_cast_fp16)[name = tensor("op_3723_cast_fp16")]; tensor var_3724 = const()[name = tensor("op_3724"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_61_cast_fp16 = reshape(shape = var_3724, x = var_3723_cast_fp16)[name = tensor("matrix_bd_61_cast_fp16")]; tensor matrix_ac_31_transpose_x_0 = const()[name = tensor("matrix_ac_31_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_31_transpose_y_0 = const()[name = tensor("matrix_ac_31_transpose_y_0"), val = tensor(false)]; tensor transpose_126_perm_0 = const()[name = tensor("transpose_126_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_127_perm_0 = const()[name = tensor("transpose_127_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_127 = transpose(perm = transpose_127_perm_0, x = k_61_cast_fp16)[name = tensor("transpose_225")]; tensor transpose_126 = transpose(perm = transpose_126_perm_0, x = var_3707_cast_fp16)[name = tensor("transpose_226")]; tensor matrix_ac_31_cast_fp16 = matmul(transpose_x = matrix_ac_31_transpose_x_0, transpose_y = matrix_ac_31_transpose_y_0, x = transpose_126, y = transpose_127)[name = tensor("matrix_ac_31_cast_fp16")]; tensor matrix_bd_63_begin_0 = const()[name = tensor("matrix_bd_63_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_63_end_0 = const()[name = tensor("matrix_bd_63_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_63_end_mask_0 = const()[name = tensor("matrix_bd_63_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_63_cast_fp16 = slice_by_index(begin = matrix_bd_63_begin_0, end = matrix_bd_63_end_0, end_mask = matrix_bd_63_end_mask_0, x = matrix_bd_61_cast_fp16)[name = tensor("matrix_bd_63_cast_fp16")]; tensor var_3733_cast_fp16 = add(x = matrix_ac_31_cast_fp16, y = matrix_bd_63_cast_fp16)[name = tensor("op_3733_cast_fp16")]; tensor _inversed_scores_61_y_0_to_fp16 = const()[name = tensor("_inversed_scores_61_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_61_cast_fp16 = mul(x = var_3733_cast_fp16, y = _inversed_scores_61_y_0_to_fp16)[name = tensor("_inversed_scores_61_cast_fp16")]; tensor scores_63_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_61_cast_fp16, cond = mask_11)[name = tensor("scores_63_cast_fp16")]; tensor var_3739_cast_fp16 = softmax(axis = var_59, x = scores_63_cast_fp16)[name = tensor("op_3739_cast_fp16")]; tensor input_821_cast_fp16 = select(a = var_44_to_fp16, b = var_3739_cast_fp16, cond = mask_11)[name = tensor("input_821_cast_fp16")]; tensor x_403_transpose_x_0 = const()[name = tensor("x_403_transpose_x_0"), val = tensor(false)]; tensor x_403_transpose_y_0 = const()[name = tensor("x_403_transpose_y_0"), val = tensor(false)]; tensor value_39_cast_fp16 = transpose(perm = value_39_perm_0, x = v_31_cast_fp16)[name = tensor("transpose_224")]; tensor x_403_cast_fp16 = matmul(transpose_x = x_403_transpose_x_0, transpose_y = x_403_transpose_y_0, x = input_821_cast_fp16, y = value_39_cast_fp16)[name = tensor("x_403_cast_fp16")]; tensor var_3743_perm_0 = const()[name = tensor("op_3743_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3744 = const()[name = tensor("op_3744"), val = tensor([1, -1, 1024])]; tensor var_3743_cast_fp16 = transpose(perm = var_3743_perm_0, x = x_403_cast_fp16)[name = tensor("transpose_223")]; tensor input_823_cast_fp16 = reshape(shape = var_3744, x = var_3743_cast_fp16)[name = tensor("input_823_cast_fp16")]; tensor encoder_layers_15_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312627392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(313413888))), name = tensor("encoder_layers_15_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_15_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(313414080)))]; tensor linear_142_cast_fp16 = linear(bias = encoder_layers_15_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_15_self_attn_linear_out_weight_to_fp16_palettized, x = input_823_cast_fp16)[name = tensor("linear_142_cast_fp16")]; tensor input_827_cast_fp16 = add(x = input_817_cast_fp16, y = linear_142_cast_fp16)[name = tensor("input_827_cast_fp16")]; tensor x_407_axes_0 = const()[name = tensor("x_407_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_15_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(313416192)))]; tensor encoder_layers_15_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_15_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(313418304)))]; tensor x_407_cast_fp16 = layer_norm(axes = x_407_axes_0, beta = encoder_layers_15_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_15_norm_conv_weight_to_fp16, x = input_827_cast_fp16)[name = tensor("x_407_cast_fp16")]; tensor input_829_perm_0 = const()[name = tensor("input_829_perm_0"), val = tensor([0, 2, 1])]; tensor input_831_pad_type_0 = const()[name = tensor("input_831_pad_type_0"), val = tensor("valid")]; tensor input_831_strides_0 = const()[name = tensor("input_831_strides_0"), val = tensor([1])]; tensor input_831_pad_0 = const()[name = tensor("input_831_pad_0"), val = tensor([0, 0])]; tensor input_831_dilations_0 = const()[name = tensor("input_831_dilations_0"), val = tensor([1])]; tensor input_831_groups_0 = const()[name = tensor("input_831_groups_0"), val = tensor(1)]; tensor encoder_layers_15_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_15_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(313420416))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(315517632))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_829_cast_fp16 = transpose(perm = input_829_perm_0, x = x_407_cast_fp16)[name = tensor("transpose_222")]; tensor input_831_cast_fp16 = conv(dilations = input_831_dilations_0, groups = input_831_groups_0, pad = input_831_pad_0, pad_type = input_831_pad_type_0, strides = input_831_strides_0, weight = encoder_layers_15_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_829_cast_fp16)[name = tensor("input_831_cast_fp16")]; tensor x_409_split_num_splits_0 = const()[name = tensor("x_409_split_num_splits_0"), val = tensor(2)]; tensor x_409_split_axis_0 = const()[name = tensor("x_409_split_axis_0"), val = tensor(1)]; tensor x_409_split_cast_fp16_0, tensor x_409_split_cast_fp16_1 = split(axis = x_409_split_axis_0, num_splits = x_409_split_num_splits_0, x = input_831_cast_fp16)[name = tensor("x_409_split_cast_fp16")]; tensor x_409_split_1_sigmoid_cast_fp16 = sigmoid(x = x_409_split_cast_fp16_1)[name = tensor("x_409_split_1_sigmoid_cast_fp16")]; tensor x_409_cast_fp16 = mul(x = x_409_split_cast_fp16_0, y = x_409_split_1_sigmoid_cast_fp16)[name = tensor("x_409_cast_fp16")]; tensor input_833_cast_fp16 = select(a = var_44_to_fp16, b = x_409_cast_fp16, cond = var_575)[name = tensor("input_833_cast_fp16")]; tensor new_x_63_interleave_0 = const()[name = tensor("new_x_63_interleave_0"), val = tensor(false)]; tensor new_x_63_cast_fp16 = concat(axis = var_59, interleave = new_x_63_interleave_0, values = (cache_63_cast_fp16, input_833_cast_fp16))[name = tensor("new_x_63_cast_fp16")]; tensor var_3783_begin_0 = const()[name = tensor("op_3783_begin_0"), val = tensor([0, 0, 7])]; tensor var_3783_end_0 = const()[name = tensor("op_3783_end_0"), val = tensor([1, 1024, 15])]; tensor var_3783_end_mask_0 = const()[name = tensor("op_3783_end_mask_0"), val = tensor([true, true, true])]; tensor var_3783_cast_fp16 = slice_by_index(begin = var_3783_begin_0, end = var_3783_end_0, end_mask = var_3783_end_mask_0, x = new_x_63_cast_fp16)[name = tensor("op_3783_cast_fp16")]; tensor x_411_pad_type_0 = const()[name = tensor("x_411_pad_type_0"), val = tensor("valid")]; tensor x_411_groups_0 = const()[name = tensor("x_411_groups_0"), val = tensor(1024)]; tensor x_411_strides_0 = const()[name = tensor("x_411_strides_0"), val = tensor([1])]; tensor x_411_pad_0 = const()[name = tensor("x_411_pad_0"), val = tensor([0, 0])]; tensor x_411_dilations_0 = const()[name = tensor("x_411_dilations_0"), val = tensor([1])]; tensor encoder_layers_15_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_15_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(315521792))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(315531072))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_411_cast_fp16 = conv(dilations = x_411_dilations_0, groups = x_411_groups_0, pad = x_411_pad_0, pad_type = x_411_pad_type_0, strides = x_411_strides_0, weight = encoder_layers_15_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_63_cast_fp16)[name = tensor("x_411_cast_fp16")]; tensor input_835_perm_0 = const()[name = tensor("input_835_perm_0"), val = tensor([0, 2, 1])]; tensor x_413_axes_0 = const()[name = tensor("x_413_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_15_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(315533184)))]; tensor encoder_layers_15_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_15_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(315535296)))]; tensor input_835_cast_fp16 = transpose(perm = input_835_perm_0, x = x_411_cast_fp16)[name = tensor("transpose_221")]; tensor x_413_cast_fp16 = layer_norm(axes = x_413_axes_0, beta = encoder_layers_15_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_15_conv_batch_norm_weight_to_fp16, x = input_835_cast_fp16)[name = tensor("x_413_cast_fp16")]; tensor input_837_perm_0 = const()[name = tensor("input_837_perm_0"), val = tensor([0, 2, 1])]; tensor input_837_cast_fp16 = transpose(perm = input_837_perm_0, x = x_413_cast_fp16)[name = tensor("transpose_220")]; tensor input_839_cast_fp16 = silu(x = input_837_cast_fp16)[name = tensor("input_839_cast_fp16")]; tensor x_415_pad_type_0 = const()[name = tensor("x_415_pad_type_0"), val = tensor("valid")]; tensor x_415_strides_0 = const()[name = tensor("x_415_strides_0"), val = tensor([1])]; tensor x_415_pad_0 = const()[name = tensor("x_415_pad_0"), val = tensor([0, 0])]; tensor x_415_dilations_0 = const()[name = tensor("x_415_dilations_0"), val = tensor([1])]; tensor x_415_groups_0 = const()[name = tensor("x_415_groups_0"), val = tensor(1)]; tensor encoder_layers_15_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_15_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(315537408))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316586048))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_415_cast_fp16 = conv(dilations = x_415_dilations_0, groups = x_415_groups_0, pad = x_415_pad_0, pad_type = x_415_pad_type_0, strides = x_415_strides_0, weight = encoder_layers_15_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_839_cast_fp16)[name = tensor("x_415_cast_fp16")]; tensor input_841_perm_0 = const()[name = tensor("input_841_perm_0"), val = tensor([0, 2, 1])]; tensor input_841_cast_fp16 = transpose(perm = input_841_perm_0, x = x_415_cast_fp16)[name = tensor("transpose_219")]; tensor input_843_cast_fp16 = add(x = input_827_cast_fp16, y = input_841_cast_fp16)[name = tensor("input_843_cast_fp16")]; tensor input_845_axes_0 = const()[name = tensor("input_845_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_15_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316588160)))]; tensor encoder_layers_15_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_15_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316590272)))]; tensor input_845_cast_fp16 = layer_norm(axes = input_845_axes_0, beta = encoder_layers_15_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_15_norm_feed_forward2_weight_to_fp16, x = input_843_cast_fp16)[name = tensor("input_845_cast_fp16")]; tensor encoder_layers_15_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316592384))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(319738176))), name = tensor("encoder_layers_15_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_15_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_15_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(319738368)))]; tensor linear_143_cast_fp16 = linear(bias = encoder_layers_15_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_15_feed_forward2_linear1_weight_to_fp16_palettized, x = input_845_cast_fp16)[name = tensor("linear_143_cast_fp16")]; tensor input_849_cast_fp16 = silu(x = linear_143_cast_fp16)[name = tensor("input_849_cast_fp16")]; tensor encoder_layers_15_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(319746624))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(322892416))), name = tensor("encoder_layers_15_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_15_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_15_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(322892608)))]; tensor linear_144_cast_fp16 = linear(bias = encoder_layers_15_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_15_feed_forward2_linear2_weight_to_fp16_palettized, x = input_849_cast_fp16)[name = tensor("linear_144_cast_fp16")]; tensor var_3826_to_fp16 = const()[name = tensor("op_3826_to_fp16"), val = tensor(0x1p-1)]; tensor var_3827_cast_fp16 = mul(x = linear_144_cast_fp16, y = var_3826_to_fp16)[name = tensor("op_3827_cast_fp16")]; tensor input_855_cast_fp16 = add(x = input_843_cast_fp16, y = var_3827_cast_fp16)[name = tensor("input_855_cast_fp16")]; tensor input_857_axes_0 = const()[name = tensor("input_857_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_15_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(322894720)))]; tensor encoder_layers_15_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_15_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(322896832)))]; tensor input_857_cast_fp16 = layer_norm(axes = input_857_axes_0, beta = encoder_layers_15_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_15_norm_out_weight_to_fp16, x = input_855_cast_fp16)[name = tensor("input_857_cast_fp16")]; tensor cache_65_begin_0 = const()[name = tensor("cache_65_begin_0"), val = tensor([16, 0, 0, 0])]; tensor cache_65_end_0 = const()[name = tensor("cache_65_end_0"), val = tensor([17, 1, 42, 1024])]; tensor cache_65_end_mask_0 = const()[name = tensor("cache_65_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_65_squeeze_mask_0 = const()[name = tensor("cache_65_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_65_cast_fp16 = slice_by_index(begin = cache_65_begin_0, end = cache_65_end_0, end_mask = cache_65_end_mask_0, squeeze_mask = cache_65_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_65_cast_fp16")]; tensor cache_67_begin_0 = const()[name = tensor("cache_67_begin_0"), val = tensor([16, 0, 0, 0])]; tensor cache_67_end_0 = const()[name = tensor("cache_67_end_0"), val = tensor([17, 1, 1024, 8])]; tensor cache_67_end_mask_0 = const()[name = tensor("cache_67_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_67_squeeze_mask_0 = const()[name = tensor("cache_67_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_67_cast_fp16 = slice_by_index(begin = cache_67_begin_0, end = cache_67_end_0, end_mask = cache_67_end_mask_0, squeeze_mask = cache_67_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_67_cast_fp16")]; tensor input_859_axes_0 = const()[name = tensor("input_859_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_16_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(322898944)))]; tensor encoder_layers_16_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_16_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(322901056)))]; tensor input_859_cast_fp16 = layer_norm(axes = input_859_axes_0, beta = encoder_layers_16_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_16_norm_feed_forward1_weight_to_fp16, x = input_857_cast_fp16)[name = tensor("input_859_cast_fp16")]; tensor encoder_layers_16_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(322903168))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(326048960))), name = tensor("encoder_layers_16_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_16_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_16_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(326049152)))]; tensor linear_145_cast_fp16 = linear(bias = encoder_layers_16_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_16_feed_forward1_linear1_weight_to_fp16_palettized, x = input_859_cast_fp16)[name = tensor("linear_145_cast_fp16")]; tensor input_863_cast_fp16 = silu(x = linear_145_cast_fp16)[name = tensor("input_863_cast_fp16")]; tensor encoder_layers_16_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(326057408))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329203200))), name = tensor("encoder_layers_16_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_16_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_16_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329203392)))]; tensor linear_146_cast_fp16 = linear(bias = encoder_layers_16_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_16_feed_forward1_linear2_weight_to_fp16_palettized, x = input_863_cast_fp16)[name = tensor("linear_146_cast_fp16")]; tensor var_3863_to_fp16 = const()[name = tensor("op_3863_to_fp16"), val = tensor(0x1p-1)]; tensor var_3864_cast_fp16 = mul(x = linear_146_cast_fp16, y = var_3863_to_fp16)[name = tensor("op_3864_cast_fp16")]; tensor input_869_cast_fp16 = add(x = input_857_cast_fp16, y = var_3864_cast_fp16)[name = tensor("input_869_cast_fp16")]; tensor key_33_axes_0 = const()[name = tensor("key_33_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_16_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329205504)))]; tensor encoder_layers_16_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_16_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329207616)))]; tensor key_33_cast_fp16 = layer_norm(axes = key_33_axes_0, beta = encoder_layers_16_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_16_norm_self_att_weight_to_fp16, x = input_869_cast_fp16)[name = tensor("key_33_cast_fp16")]; tensor input_871_interleave_0 = const()[name = tensor("input_871_interleave_0"), val = tensor(false)]; tensor input_871_cast_fp16 = concat(axis = var_68, interleave = input_871_interleave_0, values = (cache_65_cast_fp16, key_33_cast_fp16))[name = tensor("input_871_cast_fp16")]; tensor var_3886_begin_0 = const()[name = tensor("op_3886_begin_0"), val = tensor([0, 7, 0])]; tensor var_3886_end_0 = const()[name = tensor("op_3886_end_0"), val = tensor([1, 42, 1024])]; tensor var_3886_end_mask_0 = const()[name = tensor("op_3886_end_mask_0"), val = tensor([true, true, true])]; tensor var_3886_cast_fp16 = slice_by_index(begin = var_3886_begin_0, end = var_3886_end_0, end_mask = var_3886_end_mask_0, x = cache_65_cast_fp16)[name = tensor("op_3886_cast_fp16")]; tensor var_3892_interleave_0 = const()[name = tensor("op_3892_interleave_0"), val = tensor(false)]; tensor var_3892_cast_fp16 = concat(axis = var_68, interleave = var_3892_interleave_0, values = (var_3886_cast_fp16, key_33_cast_fp16))[name = tensor("op_3892_cast_fp16")]; tensor encoder_layers_16_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329209728))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329996224))), name = tensor("encoder_layers_16_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_16_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329996416)))]; tensor linear_147_cast_fp16 = linear(bias = encoder_layers_16_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_16_self_attn_linear_q_weight_to_fp16_palettized, x = key_33_cast_fp16)[name = tensor("linear_147_cast_fp16")]; tensor var_3897 = const()[name = tensor("op_3897"), val = tensor([1, -1, 8, 128])]; tensor q_97_cast_fp16 = reshape(shape = var_3897, x = linear_147_cast_fp16)[name = tensor("q_97_cast_fp16")]; tensor encoder_layers_16_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329998528))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(330785024))), name = tensor("encoder_layers_16_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_16_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(330785216)))]; tensor linear_148_cast_fp16 = linear(bias = encoder_layers_16_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_16_self_attn_linear_k_weight_to_fp16_palettized, x = input_871_cast_fp16)[name = tensor("linear_148_cast_fp16")]; tensor var_3902 = const()[name = tensor("op_3902"), val = tensor([1, -1, 8, 128])]; tensor k_65_cast_fp16 = reshape(shape = var_3902, x = linear_148_cast_fp16)[name = tensor("k_65_cast_fp16")]; tensor encoder_layers_16_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(330787328))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(331573824))), name = tensor("encoder_layers_16_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_16_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(331574016)))]; tensor linear_149_cast_fp16 = linear(bias = encoder_layers_16_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_16_self_attn_linear_v_weight_to_fp16_palettized, x = input_871_cast_fp16)[name = tensor("linear_149_cast_fp16")]; tensor var_3907 = const()[name = tensor("op_3907"), val = tensor([1, -1, 8, 128])]; tensor v_33_cast_fp16 = reshape(shape = var_3907, x = linear_149_cast_fp16)[name = tensor("v_33_cast_fp16")]; tensor value_41_perm_0 = const()[name = tensor("value_41_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_16_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(331576128)))]; tensor var_3920_cast_fp16 = add(x = q_97_cast_fp16, y = encoder_layers_16_self_attn_pos_bias_u_to_fp16)[name = tensor("op_3920_cast_fp16")]; tensor encoder_layers_16_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(331578240)))]; tensor var_3922_cast_fp16 = add(x = q_97_cast_fp16, y = encoder_layers_16_self_attn_pos_bias_v_to_fp16)[name = tensor("op_3922_cast_fp16")]; tensor q_with_bias_v_33_perm_0 = const()[name = tensor("q_with_bias_v_33_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_423_transpose_x_0 = const()[name = tensor("x_423_transpose_x_0"), val = tensor(false)]; tensor x_423_transpose_y_0 = const()[name = tensor("x_423_transpose_y_0"), val = tensor(false)]; tensor op_3924_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_3924_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(331580352))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(331679936))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(331679744)))]; tensor q_with_bias_v_33_cast_fp16 = transpose(perm = q_with_bias_v_33_perm_0, x = var_3922_cast_fp16)[name = tensor("transpose_218")]; tensor x_423_cast_fp16 = matmul(transpose_x = x_423_transpose_x_0, transpose_y = x_423_transpose_y_0, x = q_with_bias_v_33_cast_fp16, y = op_3924_to_fp16_quantized)[name = tensor("x_423_cast_fp16")]; tensor x_425_pad_0 = const()[name = tensor("x_425_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_425_mode_0 = const()[name = tensor("x_425_mode_0"), val = tensor("constant")]; tensor const_287_to_fp16 = const()[name = tensor("const_287_to_fp16"), val = tensor(0x0p+0)]; tensor x_425_cast_fp16 = pad(constant_val = const_287_to_fp16, mode = x_425_mode_0, pad = x_425_pad_0, x = x_423_cast_fp16)[name = tensor("x_425_cast_fp16")]; tensor var_3932 = const()[name = tensor("op_3932"), val = tensor([1, 8, -1, 7])]; tensor x_427_cast_fp16 = reshape(shape = var_3932, x = x_425_cast_fp16)[name = tensor("x_427_cast_fp16")]; tensor var_3936_begin_0 = const()[name = tensor("op_3936_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_3936_end_0 = const()[name = tensor("op_3936_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_3936_end_mask_0 = const()[name = tensor("op_3936_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_3936_cast_fp16 = slice_by_index(begin = var_3936_begin_0, end = var_3936_end_0, end_mask = var_3936_end_mask_0, x = x_427_cast_fp16)[name = tensor("op_3936_cast_fp16")]; tensor var_3937 = const()[name = tensor("op_3937"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_65_cast_fp16 = reshape(shape = var_3937, x = var_3936_cast_fp16)[name = tensor("matrix_bd_65_cast_fp16")]; tensor matrix_ac_33_transpose_x_0 = const()[name = tensor("matrix_ac_33_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_33_transpose_y_0 = const()[name = tensor("matrix_ac_33_transpose_y_0"), val = tensor(false)]; tensor transpose_128_perm_0 = const()[name = tensor("transpose_128_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_129_perm_0 = const()[name = tensor("transpose_129_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_129 = transpose(perm = transpose_129_perm_0, x = k_65_cast_fp16)[name = tensor("transpose_216")]; tensor transpose_128 = transpose(perm = transpose_128_perm_0, x = var_3920_cast_fp16)[name = tensor("transpose_217")]; tensor matrix_ac_33_cast_fp16 = matmul(transpose_x = matrix_ac_33_transpose_x_0, transpose_y = matrix_ac_33_transpose_y_0, x = transpose_128, y = transpose_129)[name = tensor("matrix_ac_33_cast_fp16")]; tensor matrix_bd_67_begin_0 = const()[name = tensor("matrix_bd_67_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_67_end_0 = const()[name = tensor("matrix_bd_67_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_67_end_mask_0 = const()[name = tensor("matrix_bd_67_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_67_cast_fp16 = slice_by_index(begin = matrix_bd_67_begin_0, end = matrix_bd_67_end_0, end_mask = matrix_bd_67_end_mask_0, x = matrix_bd_65_cast_fp16)[name = tensor("matrix_bd_67_cast_fp16")]; tensor var_3946_cast_fp16 = add(x = matrix_ac_33_cast_fp16, y = matrix_bd_67_cast_fp16)[name = tensor("op_3946_cast_fp16")]; tensor _inversed_scores_65_y_0_to_fp16 = const()[name = tensor("_inversed_scores_65_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_65_cast_fp16 = mul(x = var_3946_cast_fp16, y = _inversed_scores_65_y_0_to_fp16)[name = tensor("_inversed_scores_65_cast_fp16")]; tensor scores_67_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_65_cast_fp16, cond = mask_11)[name = tensor("scores_67_cast_fp16")]; tensor var_3952_cast_fp16 = softmax(axis = var_59, x = scores_67_cast_fp16)[name = tensor("op_3952_cast_fp16")]; tensor input_873_cast_fp16 = select(a = var_44_to_fp16, b = var_3952_cast_fp16, cond = mask_11)[name = tensor("input_873_cast_fp16")]; tensor x_429_transpose_x_0 = const()[name = tensor("x_429_transpose_x_0"), val = tensor(false)]; tensor x_429_transpose_y_0 = const()[name = tensor("x_429_transpose_y_0"), val = tensor(false)]; tensor value_41_cast_fp16 = transpose(perm = value_41_perm_0, x = v_33_cast_fp16)[name = tensor("transpose_215")]; tensor x_429_cast_fp16 = matmul(transpose_x = x_429_transpose_x_0, transpose_y = x_429_transpose_y_0, x = input_873_cast_fp16, y = value_41_cast_fp16)[name = tensor("x_429_cast_fp16")]; tensor var_3956_perm_0 = const()[name = tensor("op_3956_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3957 = const()[name = tensor("op_3957"), val = tensor([1, -1, 1024])]; tensor var_3956_cast_fp16 = transpose(perm = var_3956_perm_0, x = x_429_cast_fp16)[name = tensor("transpose_214")]; tensor input_875_cast_fp16 = reshape(shape = var_3957, x = var_3956_cast_fp16)[name = tensor("input_875_cast_fp16")]; tensor encoder_layers_16_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(331680256))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(332466752))), name = tensor("encoder_layers_16_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_16_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(332466944)))]; tensor linear_151_cast_fp16 = linear(bias = encoder_layers_16_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_16_self_attn_linear_out_weight_to_fp16_palettized, x = input_875_cast_fp16)[name = tensor("linear_151_cast_fp16")]; tensor input_879_cast_fp16 = add(x = input_869_cast_fp16, y = linear_151_cast_fp16)[name = tensor("input_879_cast_fp16")]; tensor x_433_axes_0 = const()[name = tensor("x_433_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_16_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(332469056)))]; tensor encoder_layers_16_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_16_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(332471168)))]; tensor x_433_cast_fp16 = layer_norm(axes = x_433_axes_0, beta = encoder_layers_16_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_16_norm_conv_weight_to_fp16, x = input_879_cast_fp16)[name = tensor("x_433_cast_fp16")]; tensor input_881_perm_0 = const()[name = tensor("input_881_perm_0"), val = tensor([0, 2, 1])]; tensor input_883_pad_type_0 = const()[name = tensor("input_883_pad_type_0"), val = tensor("valid")]; tensor input_883_strides_0 = const()[name = tensor("input_883_strides_0"), val = tensor([1])]; tensor input_883_pad_0 = const()[name = tensor("input_883_pad_0"), val = tensor([0, 0])]; tensor input_883_dilations_0 = const()[name = tensor("input_883_dilations_0"), val = tensor([1])]; tensor input_883_groups_0 = const()[name = tensor("input_883_groups_0"), val = tensor(1)]; tensor encoder_layers_16_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_16_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(332473280))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(334570496))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_881_cast_fp16 = transpose(perm = input_881_perm_0, x = x_433_cast_fp16)[name = tensor("transpose_213")]; tensor input_883_cast_fp16 = conv(dilations = input_883_dilations_0, groups = input_883_groups_0, pad = input_883_pad_0, pad_type = input_883_pad_type_0, strides = input_883_strides_0, weight = encoder_layers_16_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_881_cast_fp16)[name = tensor("input_883_cast_fp16")]; tensor x_435_split_num_splits_0 = const()[name = tensor("x_435_split_num_splits_0"), val = tensor(2)]; tensor x_435_split_axis_0 = const()[name = tensor("x_435_split_axis_0"), val = tensor(1)]; tensor x_435_split_cast_fp16_0, tensor x_435_split_cast_fp16_1 = split(axis = x_435_split_axis_0, num_splits = x_435_split_num_splits_0, x = input_883_cast_fp16)[name = tensor("x_435_split_cast_fp16")]; tensor x_435_split_1_sigmoid_cast_fp16 = sigmoid(x = x_435_split_cast_fp16_1)[name = tensor("x_435_split_1_sigmoid_cast_fp16")]; tensor x_435_cast_fp16 = mul(x = x_435_split_cast_fp16_0, y = x_435_split_1_sigmoid_cast_fp16)[name = tensor("x_435_cast_fp16")]; tensor input_885_cast_fp16 = select(a = var_44_to_fp16, b = x_435_cast_fp16, cond = var_575)[name = tensor("input_885_cast_fp16")]; tensor new_x_67_interleave_0 = const()[name = tensor("new_x_67_interleave_0"), val = tensor(false)]; tensor new_x_67_cast_fp16 = concat(axis = var_59, interleave = new_x_67_interleave_0, values = (cache_67_cast_fp16, input_885_cast_fp16))[name = tensor("new_x_67_cast_fp16")]; tensor var_3996_begin_0 = const()[name = tensor("op_3996_begin_0"), val = tensor([0, 0, 7])]; tensor var_3996_end_0 = const()[name = tensor("op_3996_end_0"), val = tensor([1, 1024, 15])]; tensor var_3996_end_mask_0 = const()[name = tensor("op_3996_end_mask_0"), val = tensor([true, true, true])]; tensor var_3996_cast_fp16 = slice_by_index(begin = var_3996_begin_0, end = var_3996_end_0, end_mask = var_3996_end_mask_0, x = new_x_67_cast_fp16)[name = tensor("op_3996_cast_fp16")]; tensor x_437_pad_type_0 = const()[name = tensor("x_437_pad_type_0"), val = tensor("valid")]; tensor x_437_groups_0 = const()[name = tensor("x_437_groups_0"), val = tensor(1024)]; tensor x_437_strides_0 = const()[name = tensor("x_437_strides_0"), val = tensor([1])]; tensor x_437_pad_0 = const()[name = tensor("x_437_pad_0"), val = tensor([0, 0])]; tensor x_437_dilations_0 = const()[name = tensor("x_437_dilations_0"), val = tensor([1])]; tensor encoder_layers_16_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_16_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(334574656))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(334583936))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_437_cast_fp16 = conv(dilations = x_437_dilations_0, groups = x_437_groups_0, pad = x_437_pad_0, pad_type = x_437_pad_type_0, strides = x_437_strides_0, weight = encoder_layers_16_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_67_cast_fp16)[name = tensor("x_437_cast_fp16")]; tensor input_887_perm_0 = const()[name = tensor("input_887_perm_0"), val = tensor([0, 2, 1])]; tensor x_439_axes_0 = const()[name = tensor("x_439_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_16_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(334586048)))]; tensor encoder_layers_16_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_16_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(334588160)))]; tensor input_887_cast_fp16 = transpose(perm = input_887_perm_0, x = x_437_cast_fp16)[name = tensor("transpose_212")]; tensor x_439_cast_fp16 = layer_norm(axes = x_439_axes_0, beta = encoder_layers_16_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_16_conv_batch_norm_weight_to_fp16, x = input_887_cast_fp16)[name = tensor("x_439_cast_fp16")]; tensor input_889_perm_0 = const()[name = tensor("input_889_perm_0"), val = tensor([0, 2, 1])]; tensor input_889_cast_fp16 = transpose(perm = input_889_perm_0, x = x_439_cast_fp16)[name = tensor("transpose_211")]; tensor input_891_cast_fp16 = silu(x = input_889_cast_fp16)[name = tensor("input_891_cast_fp16")]; tensor x_441_pad_type_0 = const()[name = tensor("x_441_pad_type_0"), val = tensor("valid")]; tensor x_441_strides_0 = const()[name = tensor("x_441_strides_0"), val = tensor([1])]; tensor x_441_pad_0 = const()[name = tensor("x_441_pad_0"), val = tensor([0, 0])]; tensor x_441_dilations_0 = const()[name = tensor("x_441_dilations_0"), val = tensor([1])]; tensor x_441_groups_0 = const()[name = tensor("x_441_groups_0"), val = tensor(1)]; tensor encoder_layers_16_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_16_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(334590272))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(335638912))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_441_cast_fp16 = conv(dilations = x_441_dilations_0, groups = x_441_groups_0, pad = x_441_pad_0, pad_type = x_441_pad_type_0, strides = x_441_strides_0, weight = encoder_layers_16_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_891_cast_fp16)[name = tensor("x_441_cast_fp16")]; tensor input_893_perm_0 = const()[name = tensor("input_893_perm_0"), val = tensor([0, 2, 1])]; tensor input_893_cast_fp16 = transpose(perm = input_893_perm_0, x = x_441_cast_fp16)[name = tensor("transpose_210")]; tensor input_895_cast_fp16 = add(x = input_879_cast_fp16, y = input_893_cast_fp16)[name = tensor("input_895_cast_fp16")]; tensor input_897_axes_0 = const()[name = tensor("input_897_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_16_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(335641024)))]; tensor encoder_layers_16_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_16_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(335643136)))]; tensor input_897_cast_fp16 = layer_norm(axes = input_897_axes_0, beta = encoder_layers_16_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_16_norm_feed_forward2_weight_to_fp16, x = input_895_cast_fp16)[name = tensor("input_897_cast_fp16")]; tensor encoder_layers_16_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(335645248))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(338791040))), name = tensor("encoder_layers_16_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_16_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_16_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(338791232)))]; tensor linear_152_cast_fp16 = linear(bias = encoder_layers_16_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_16_feed_forward2_linear1_weight_to_fp16_palettized, x = input_897_cast_fp16)[name = tensor("linear_152_cast_fp16")]; tensor input_901_cast_fp16 = silu(x = linear_152_cast_fp16)[name = tensor("input_901_cast_fp16")]; tensor encoder_layers_16_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(338799488))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341945280))), name = tensor("encoder_layers_16_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_16_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_16_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341945472)))]; tensor linear_153_cast_fp16 = linear(bias = encoder_layers_16_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_16_feed_forward2_linear2_weight_to_fp16_palettized, x = input_901_cast_fp16)[name = tensor("linear_153_cast_fp16")]; tensor var_4039_to_fp16 = const()[name = tensor("op_4039_to_fp16"), val = tensor(0x1p-1)]; tensor var_4040_cast_fp16 = mul(x = linear_153_cast_fp16, y = var_4039_to_fp16)[name = tensor("op_4040_cast_fp16")]; tensor input_907_cast_fp16 = add(x = input_895_cast_fp16, y = var_4040_cast_fp16)[name = tensor("input_907_cast_fp16")]; tensor input_909_axes_0 = const()[name = tensor("input_909_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_16_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341947584)))]; tensor encoder_layers_16_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_16_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341949696)))]; tensor input_909_cast_fp16 = layer_norm(axes = input_909_axes_0, beta = encoder_layers_16_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_16_norm_out_weight_to_fp16, x = input_907_cast_fp16)[name = tensor("input_909_cast_fp16")]; tensor cache_69_begin_0 = const()[name = tensor("cache_69_begin_0"), val = tensor([17, 0, 0, 0])]; tensor cache_69_end_0 = const()[name = tensor("cache_69_end_0"), val = tensor([18, 1, 42, 1024])]; tensor cache_69_end_mask_0 = const()[name = tensor("cache_69_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_69_squeeze_mask_0 = const()[name = tensor("cache_69_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_69_cast_fp16 = slice_by_index(begin = cache_69_begin_0, end = cache_69_end_0, end_mask = cache_69_end_mask_0, squeeze_mask = cache_69_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_69_cast_fp16")]; tensor cache_71_begin_0 = const()[name = tensor("cache_71_begin_0"), val = tensor([17, 0, 0, 0])]; tensor cache_71_end_0 = const()[name = tensor("cache_71_end_0"), val = tensor([18, 1, 1024, 8])]; tensor cache_71_end_mask_0 = const()[name = tensor("cache_71_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_71_squeeze_mask_0 = const()[name = tensor("cache_71_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_71_cast_fp16 = slice_by_index(begin = cache_71_begin_0, end = cache_71_end_0, end_mask = cache_71_end_mask_0, squeeze_mask = cache_71_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_71_cast_fp16")]; tensor input_911_axes_0 = const()[name = tensor("input_911_axes_0"), val = tensor([-1])]; tensor encoder_layers_17_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_17_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341951808)))]; tensor encoder_layers_17_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_17_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341953920)))]; tensor input_911_cast_fp16 = layer_norm(axes = input_911_axes_0, beta = encoder_layers_17_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_17_norm_feed_forward1_weight_to_fp16, x = input_909_cast_fp16)[name = tensor("input_911_cast_fp16")]; tensor encoder_layers_17_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341956032))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345101824))), name = tensor("encoder_layers_17_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_17_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_17_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345102016)))]; tensor linear_154_cast_fp16 = linear(bias = encoder_layers_17_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_17_feed_forward1_linear1_weight_to_fp16_palettized, x = input_911_cast_fp16)[name = tensor("linear_154_cast_fp16")]; tensor input_915_cast_fp16 = silu(x = linear_154_cast_fp16)[name = tensor("input_915_cast_fp16")]; tensor encoder_layers_17_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345110272))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(348256064))), name = tensor("encoder_layers_17_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_17_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_17_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(348256256)))]; tensor linear_155_cast_fp16 = linear(bias = encoder_layers_17_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_17_feed_forward1_linear2_weight_to_fp16_palettized, x = input_915_cast_fp16)[name = tensor("linear_155_cast_fp16")]; tensor var_4076_to_fp16 = const()[name = tensor("op_4076_to_fp16"), val = tensor(0x1p-1)]; tensor var_4077_cast_fp16 = mul(x = linear_155_cast_fp16, y = var_4076_to_fp16)[name = tensor("op_4077_cast_fp16")]; tensor input_921_cast_fp16 = add(x = input_909_cast_fp16, y = var_4077_cast_fp16)[name = tensor("input_921_cast_fp16")]; tensor key_35_axes_0 = const()[name = tensor("key_35_axes_0"), val = tensor([-1])]; tensor encoder_layers_17_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_17_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(348258368)))]; tensor encoder_layers_17_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_17_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(348260480)))]; tensor key_35_cast_fp16 = layer_norm(axes = key_35_axes_0, beta = encoder_layers_17_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_17_norm_self_att_weight_to_fp16, x = input_921_cast_fp16)[name = tensor("key_35_cast_fp16")]; tensor input_923_interleave_0 = const()[name = tensor("input_923_interleave_0"), val = tensor(false)]; tensor input_923_cast_fp16 = concat(axis = var_68, interleave = input_923_interleave_0, values = (cache_69_cast_fp16, key_35_cast_fp16))[name = tensor("input_923_cast_fp16")]; tensor var_4099_begin_0 = const()[name = tensor("op_4099_begin_0"), val = tensor([0, 7, 0])]; tensor var_4099_end_0 = const()[name = tensor("op_4099_end_0"), val = tensor([1, 42, 1024])]; tensor var_4099_end_mask_0 = const()[name = tensor("op_4099_end_mask_0"), val = tensor([true, true, true])]; tensor var_4099_cast_fp16 = slice_by_index(begin = var_4099_begin_0, end = var_4099_end_0, end_mask = var_4099_end_mask_0, x = cache_69_cast_fp16)[name = tensor("op_4099_cast_fp16")]; tensor var_4105_interleave_0 = const()[name = tensor("op_4105_interleave_0"), val = tensor(false)]; tensor var_4105_cast_fp16 = concat(axis = var_68, interleave = var_4105_interleave_0, values = (var_4099_cast_fp16, key_35_cast_fp16))[name = tensor("op_4105_cast_fp16")]; tensor encoder_layers_17_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(348262592))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(349049088))), name = tensor("encoder_layers_17_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_17_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(349049280)))]; tensor linear_156_cast_fp16 = linear(bias = encoder_layers_17_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_17_self_attn_linear_q_weight_to_fp16_palettized, x = key_35_cast_fp16)[name = tensor("linear_156_cast_fp16")]; tensor var_4110 = const()[name = tensor("op_4110"), val = tensor([1, -1, 8, 128])]; tensor q_103_cast_fp16 = reshape(shape = var_4110, x = linear_156_cast_fp16)[name = tensor("q_103_cast_fp16")]; tensor encoder_layers_17_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(349051392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(349837888))), name = tensor("encoder_layers_17_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_17_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(349838080)))]; tensor linear_157_cast_fp16 = linear(bias = encoder_layers_17_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_17_self_attn_linear_k_weight_to_fp16_palettized, x = input_923_cast_fp16)[name = tensor("linear_157_cast_fp16")]; tensor var_4115 = const()[name = tensor("op_4115"), val = tensor([1, -1, 8, 128])]; tensor k_69_cast_fp16 = reshape(shape = var_4115, x = linear_157_cast_fp16)[name = tensor("k_69_cast_fp16")]; tensor encoder_layers_17_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(349840192))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350626688))), name = tensor("encoder_layers_17_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_17_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350626880)))]; tensor linear_158_cast_fp16 = linear(bias = encoder_layers_17_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_17_self_attn_linear_v_weight_to_fp16_palettized, x = input_923_cast_fp16)[name = tensor("linear_158_cast_fp16")]; tensor var_4120 = const()[name = tensor("op_4120"), val = tensor([1, -1, 8, 128])]; tensor v_35_cast_fp16 = reshape(shape = var_4120, x = linear_158_cast_fp16)[name = tensor("v_35_cast_fp16")]; tensor value_43_perm_0 = const()[name = tensor("value_43_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_17_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350628992)))]; tensor var_4133_cast_fp16 = add(x = q_103_cast_fp16, y = encoder_layers_17_self_attn_pos_bias_u_to_fp16)[name = tensor("op_4133_cast_fp16")]; tensor encoder_layers_17_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350631104)))]; tensor var_4135_cast_fp16 = add(x = q_103_cast_fp16, y = encoder_layers_17_self_attn_pos_bias_v_to_fp16)[name = tensor("op_4135_cast_fp16")]; tensor q_with_bias_v_35_perm_0 = const()[name = tensor("q_with_bias_v_35_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_449_transpose_x_0 = const()[name = tensor("x_449_transpose_x_0"), val = tensor(false)]; tensor x_449_transpose_y_0 = const()[name = tensor("x_449_transpose_y_0"), val = tensor(false)]; tensor op_4137_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_4137_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350633216))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350732800))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350732608)))]; tensor q_with_bias_v_35_cast_fp16 = transpose(perm = q_with_bias_v_35_perm_0, x = var_4135_cast_fp16)[name = tensor("transpose_209")]; tensor x_449_cast_fp16 = matmul(transpose_x = x_449_transpose_x_0, transpose_y = x_449_transpose_y_0, x = q_with_bias_v_35_cast_fp16, y = op_4137_to_fp16_quantized)[name = tensor("x_449_cast_fp16")]; tensor x_451_pad_0 = const()[name = tensor("x_451_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_451_mode_0 = const()[name = tensor("x_451_mode_0"), val = tensor("constant")]; tensor const_300_to_fp16 = const()[name = tensor("const_300_to_fp16"), val = tensor(0x0p+0)]; tensor x_451_cast_fp16 = pad(constant_val = const_300_to_fp16, mode = x_451_mode_0, pad = x_451_pad_0, x = x_449_cast_fp16)[name = tensor("x_451_cast_fp16")]; tensor var_4145 = const()[name = tensor("op_4145"), val = tensor([1, 8, -1, 7])]; tensor x_453_cast_fp16 = reshape(shape = var_4145, x = x_451_cast_fp16)[name = tensor("x_453_cast_fp16")]; tensor var_4149_begin_0 = const()[name = tensor("op_4149_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_4149_end_0 = const()[name = tensor("op_4149_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_4149_end_mask_0 = const()[name = tensor("op_4149_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_4149_cast_fp16 = slice_by_index(begin = var_4149_begin_0, end = var_4149_end_0, end_mask = var_4149_end_mask_0, x = x_453_cast_fp16)[name = tensor("op_4149_cast_fp16")]; tensor var_4150 = const()[name = tensor("op_4150"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_69_cast_fp16 = reshape(shape = var_4150, x = var_4149_cast_fp16)[name = tensor("matrix_bd_69_cast_fp16")]; tensor matrix_ac_35_transpose_x_0 = const()[name = tensor("matrix_ac_35_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_35_transpose_y_0 = const()[name = tensor("matrix_ac_35_transpose_y_0"), val = tensor(false)]; tensor transpose_130_perm_0 = const()[name = tensor("transpose_130_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_131_perm_0 = const()[name = tensor("transpose_131_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_131 = transpose(perm = transpose_131_perm_0, x = k_69_cast_fp16)[name = tensor("transpose_207")]; tensor transpose_130 = transpose(perm = transpose_130_perm_0, x = var_4133_cast_fp16)[name = tensor("transpose_208")]; tensor matrix_ac_35_cast_fp16 = matmul(transpose_x = matrix_ac_35_transpose_x_0, transpose_y = matrix_ac_35_transpose_y_0, x = transpose_130, y = transpose_131)[name = tensor("matrix_ac_35_cast_fp16")]; tensor matrix_bd_71_begin_0 = const()[name = tensor("matrix_bd_71_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_71_end_0 = const()[name = tensor("matrix_bd_71_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_71_end_mask_0 = const()[name = tensor("matrix_bd_71_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_71_cast_fp16 = slice_by_index(begin = matrix_bd_71_begin_0, end = matrix_bd_71_end_0, end_mask = matrix_bd_71_end_mask_0, x = matrix_bd_69_cast_fp16)[name = tensor("matrix_bd_71_cast_fp16")]; tensor var_4159_cast_fp16 = add(x = matrix_ac_35_cast_fp16, y = matrix_bd_71_cast_fp16)[name = tensor("op_4159_cast_fp16")]; tensor _inversed_scores_69_y_0_to_fp16 = const()[name = tensor("_inversed_scores_69_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_69_cast_fp16 = mul(x = var_4159_cast_fp16, y = _inversed_scores_69_y_0_to_fp16)[name = tensor("_inversed_scores_69_cast_fp16")]; tensor scores_71_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_69_cast_fp16, cond = mask_11)[name = tensor("scores_71_cast_fp16")]; tensor var_4165_cast_fp16 = softmax(axis = var_59, x = scores_71_cast_fp16)[name = tensor("op_4165_cast_fp16")]; tensor input_925_cast_fp16 = select(a = var_44_to_fp16, b = var_4165_cast_fp16, cond = mask_11)[name = tensor("input_925_cast_fp16")]; tensor x_455_transpose_x_0 = const()[name = tensor("x_455_transpose_x_0"), val = tensor(false)]; tensor x_455_transpose_y_0 = const()[name = tensor("x_455_transpose_y_0"), val = tensor(false)]; tensor value_43_cast_fp16 = transpose(perm = value_43_perm_0, x = v_35_cast_fp16)[name = tensor("transpose_206")]; tensor x_455_cast_fp16 = matmul(transpose_x = x_455_transpose_x_0, transpose_y = x_455_transpose_y_0, x = input_925_cast_fp16, y = value_43_cast_fp16)[name = tensor("x_455_cast_fp16")]; tensor var_4169_perm_0 = const()[name = tensor("op_4169_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4170 = const()[name = tensor("op_4170"), val = tensor([1, -1, 1024])]; tensor var_4169_cast_fp16 = transpose(perm = var_4169_perm_0, x = x_455_cast_fp16)[name = tensor("transpose_205")]; tensor input_927_cast_fp16 = reshape(shape = var_4170, x = var_4169_cast_fp16)[name = tensor("input_927_cast_fp16")]; tensor encoder_layers_17_self_attn_linear_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350733120))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(351519616))), name = tensor("encoder_layers_17_self_attn_linear_out_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_17_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(351519808)))]; tensor linear_160_cast_fp16 = linear(bias = encoder_layers_17_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_17_self_attn_linear_out_weight_to_fp16_palettized, x = input_927_cast_fp16)[name = tensor("linear_160_cast_fp16")]; tensor input_931_cast_fp16 = add(x = input_921_cast_fp16, y = linear_160_cast_fp16)[name = tensor("input_931_cast_fp16")]; tensor x_459_axes_0 = const()[name = tensor("x_459_axes_0"), val = tensor([-1])]; tensor encoder_layers_17_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_17_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(351521920)))]; tensor encoder_layers_17_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_17_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(351524032)))]; tensor x_459_cast_fp16 = layer_norm(axes = x_459_axes_0, beta = encoder_layers_17_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_17_norm_conv_weight_to_fp16, x = input_931_cast_fp16)[name = tensor("x_459_cast_fp16")]; tensor input_933_perm_0 = const()[name = tensor("input_933_perm_0"), val = tensor([0, 2, 1])]; tensor input_935_pad_type_0 = const()[name = tensor("input_935_pad_type_0"), val = tensor("valid")]; tensor input_935_strides_0 = const()[name = tensor("input_935_strides_0"), val = tensor([1])]; tensor input_935_pad_0 = const()[name = tensor("input_935_pad_0"), val = tensor([0, 0])]; tensor input_935_dilations_0 = const()[name = tensor("input_935_dilations_0"), val = tensor([1])]; tensor input_935_groups_0 = const()[name = tensor("input_935_groups_0"), val = tensor(1)]; tensor encoder_layers_17_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_17_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(351526144))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(353623360))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_933_cast_fp16 = transpose(perm = input_933_perm_0, x = x_459_cast_fp16)[name = tensor("transpose_204")]; tensor input_935_cast_fp16 = conv(dilations = input_935_dilations_0, groups = input_935_groups_0, pad = input_935_pad_0, pad_type = input_935_pad_type_0, strides = input_935_strides_0, weight = encoder_layers_17_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_933_cast_fp16)[name = tensor("input_935_cast_fp16")]; tensor x_461_split_num_splits_0 = const()[name = tensor("x_461_split_num_splits_0"), val = tensor(2)]; tensor x_461_split_axis_0 = const()[name = tensor("x_461_split_axis_0"), val = tensor(1)]; tensor x_461_split_cast_fp16_0, tensor x_461_split_cast_fp16_1 = split(axis = x_461_split_axis_0, num_splits = x_461_split_num_splits_0, x = input_935_cast_fp16)[name = tensor("x_461_split_cast_fp16")]; tensor x_461_split_1_sigmoid_cast_fp16 = sigmoid(x = x_461_split_cast_fp16_1)[name = tensor("x_461_split_1_sigmoid_cast_fp16")]; tensor x_461_cast_fp16 = mul(x = x_461_split_cast_fp16_0, y = x_461_split_1_sigmoid_cast_fp16)[name = tensor("x_461_cast_fp16")]; tensor input_937_cast_fp16 = select(a = var_44_to_fp16, b = x_461_cast_fp16, cond = var_575)[name = tensor("input_937_cast_fp16")]; tensor new_x_71_interleave_0 = const()[name = tensor("new_x_71_interleave_0"), val = tensor(false)]; tensor new_x_71_cast_fp16 = concat(axis = var_59, interleave = new_x_71_interleave_0, values = (cache_71_cast_fp16, input_937_cast_fp16))[name = tensor("new_x_71_cast_fp16")]; tensor var_4209_begin_0 = const()[name = tensor("op_4209_begin_0"), val = tensor([0, 0, 7])]; tensor var_4209_end_0 = const()[name = tensor("op_4209_end_0"), val = tensor([1, 1024, 15])]; tensor var_4209_end_mask_0 = const()[name = tensor("op_4209_end_mask_0"), val = tensor([true, true, true])]; tensor var_4209_cast_fp16 = slice_by_index(begin = var_4209_begin_0, end = var_4209_end_0, end_mask = var_4209_end_mask_0, x = new_x_71_cast_fp16)[name = tensor("op_4209_cast_fp16")]; tensor x_463_pad_type_0 = const()[name = tensor("x_463_pad_type_0"), val = tensor("valid")]; tensor x_463_groups_0 = const()[name = tensor("x_463_groups_0"), val = tensor(1024)]; tensor x_463_strides_0 = const()[name = tensor("x_463_strides_0"), val = tensor([1])]; tensor x_463_pad_0 = const()[name = tensor("x_463_pad_0"), val = tensor([0, 0])]; tensor x_463_dilations_0 = const()[name = tensor("x_463_dilations_0"), val = tensor([1])]; tensor encoder_layers_17_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_17_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(353627520))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(353636800))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_463_cast_fp16 = conv(dilations = x_463_dilations_0, groups = x_463_groups_0, pad = x_463_pad_0, pad_type = x_463_pad_type_0, strides = x_463_strides_0, weight = encoder_layers_17_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_71_cast_fp16)[name = tensor("x_463_cast_fp16")]; tensor input_939_perm_0 = const()[name = tensor("input_939_perm_0"), val = tensor([0, 2, 1])]; tensor x_465_axes_0 = const()[name = tensor("x_465_axes_0"), val = tensor([-1])]; tensor encoder_layers_17_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_17_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(353638912)))]; tensor encoder_layers_17_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_17_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(353641024)))]; tensor input_939_cast_fp16 = transpose(perm = input_939_perm_0, x = x_463_cast_fp16)[name = tensor("transpose_203")]; tensor x_465_cast_fp16 = layer_norm(axes = x_465_axes_0, beta = encoder_layers_17_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_17_conv_batch_norm_weight_to_fp16, x = input_939_cast_fp16)[name = tensor("x_465_cast_fp16")]; tensor input_941_perm_0 = const()[name = tensor("input_941_perm_0"), val = tensor([0, 2, 1])]; tensor input_941_cast_fp16 = transpose(perm = input_941_perm_0, x = x_465_cast_fp16)[name = tensor("transpose_202")]; tensor input_943_cast_fp16 = silu(x = input_941_cast_fp16)[name = tensor("input_943_cast_fp16")]; tensor x_467_pad_type_0 = const()[name = tensor("x_467_pad_type_0"), val = tensor("valid")]; tensor x_467_strides_0 = const()[name = tensor("x_467_strides_0"), val = tensor([1])]; tensor x_467_pad_0 = const()[name = tensor("x_467_pad_0"), val = tensor([0, 0])]; tensor x_467_dilations_0 = const()[name = tensor("x_467_dilations_0"), val = tensor([1])]; tensor x_467_groups_0 = const()[name = tensor("x_467_groups_0"), val = tensor(1)]; tensor encoder_layers_17_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_17_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(353643136))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354691776))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_467_cast_fp16 = conv(dilations = x_467_dilations_0, groups = x_467_groups_0, pad = x_467_pad_0, pad_type = x_467_pad_type_0, strides = x_467_strides_0, weight = encoder_layers_17_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_943_cast_fp16)[name = tensor("x_467_cast_fp16")]; tensor input_945_perm_0 = const()[name = tensor("input_945_perm_0"), val = tensor([0, 2, 1])]; tensor input_945_cast_fp16 = transpose(perm = input_945_perm_0, x = x_467_cast_fp16)[name = tensor("transpose_201")]; tensor input_947_cast_fp16 = add(x = input_931_cast_fp16, y = input_945_cast_fp16)[name = tensor("input_947_cast_fp16")]; tensor input_949_axes_0 = const()[name = tensor("input_949_axes_0"), val = tensor([-1])]; tensor encoder_layers_17_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_17_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354693888)))]; tensor encoder_layers_17_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_17_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354696000)))]; tensor input_949_cast_fp16 = layer_norm(axes = input_949_axes_0, beta = encoder_layers_17_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_17_norm_feed_forward2_weight_to_fp16, x = input_947_cast_fp16)[name = tensor("input_949_cast_fp16")]; tensor encoder_layers_17_feed_forward2_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354698112))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(357843904))), name = tensor("encoder_layers_17_feed_forward2_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_17_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_17_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(357844096)))]; tensor linear_161_cast_fp16 = linear(bias = encoder_layers_17_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_17_feed_forward2_linear1_weight_to_fp16_palettized, x = input_949_cast_fp16)[name = tensor("linear_161_cast_fp16")]; tensor input_953_cast_fp16 = silu(x = linear_161_cast_fp16)[name = tensor("input_953_cast_fp16")]; tensor encoder_layers_17_feed_forward2_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(357852352))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(360998144))), name = tensor("encoder_layers_17_feed_forward2_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_17_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_17_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(360998336)))]; tensor linear_162_cast_fp16 = linear(bias = encoder_layers_17_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_17_feed_forward2_linear2_weight_to_fp16_palettized, x = input_953_cast_fp16)[name = tensor("linear_162_cast_fp16")]; tensor var_4252_to_fp16 = const()[name = tensor("op_4252_to_fp16"), val = tensor(0x1p-1)]; tensor var_4253_cast_fp16 = mul(x = linear_162_cast_fp16, y = var_4252_to_fp16)[name = tensor("op_4253_cast_fp16")]; tensor input_959_cast_fp16 = add(x = input_947_cast_fp16, y = var_4253_cast_fp16)[name = tensor("input_959_cast_fp16")]; tensor input_961_axes_0 = const()[name = tensor("input_961_axes_0"), val = tensor([-1])]; tensor encoder_layers_17_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_17_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361000448)))]; tensor encoder_layers_17_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_17_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361002560)))]; tensor input_961_cast_fp16 = layer_norm(axes = input_961_axes_0, beta = encoder_layers_17_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_17_norm_out_weight_to_fp16, x = input_959_cast_fp16)[name = tensor("input_961_cast_fp16")]; tensor cache_73_begin_0 = const()[name = tensor("cache_73_begin_0"), val = tensor([18, 0, 0, 0])]; tensor cache_73_end_0 = const()[name = tensor("cache_73_end_0"), val = tensor([19, 1, 42, 1024])]; tensor cache_73_end_mask_0 = const()[name = tensor("cache_73_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_73_squeeze_mask_0 = const()[name = tensor("cache_73_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_73_cast_fp16 = slice_by_index(begin = cache_73_begin_0, end = cache_73_end_0, end_mask = cache_73_end_mask_0, squeeze_mask = cache_73_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_73_cast_fp16")]; tensor cache_75_begin_0 = const()[name = tensor("cache_75_begin_0"), val = tensor([18, 0, 0, 0])]; tensor cache_75_end_0 = const()[name = tensor("cache_75_end_0"), val = tensor([19, 1, 1024, 8])]; tensor cache_75_end_mask_0 = const()[name = tensor("cache_75_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_75_squeeze_mask_0 = const()[name = tensor("cache_75_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_75_cast_fp16 = slice_by_index(begin = cache_75_begin_0, end = cache_75_end_0, end_mask = cache_75_end_mask_0, squeeze_mask = cache_75_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_75_cast_fp16")]; tensor input_963_axes_0 = const()[name = tensor("input_963_axes_0"), val = tensor([-1])]; tensor encoder_layers_18_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_18_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361004672)))]; tensor encoder_layers_18_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_18_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361006784)))]; tensor input_963_cast_fp16 = layer_norm(axes = input_963_axes_0, beta = encoder_layers_18_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_18_norm_feed_forward1_weight_to_fp16, x = input_961_cast_fp16)[name = tensor("input_963_cast_fp16")]; tensor encoder_layers_18_feed_forward1_linear1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361008896))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(364154688))), name = tensor("encoder_layers_18_feed_forward1_linear1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor encoder_layers_18_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_18_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(364154880)))]; tensor linear_163_cast_fp16 = linear(bias = encoder_layers_18_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_18_feed_forward1_linear1_weight_to_fp16_palettized, x = input_963_cast_fp16)[name = tensor("linear_163_cast_fp16")]; tensor input_967_cast_fp16 = silu(x = linear_163_cast_fp16)[name = tensor("input_967_cast_fp16")]; tensor encoder_layers_18_feed_forward1_linear2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(364163136))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(367308928))), name = tensor("encoder_layers_18_feed_forward1_linear2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor encoder_layers_18_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_18_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(367309120)))]; tensor linear_164_cast_fp16 = linear(bias = encoder_layers_18_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_18_feed_forward1_linear2_weight_to_fp16_palettized, x = input_967_cast_fp16)[name = tensor("linear_164_cast_fp16")]; tensor var_4289_to_fp16 = const()[name = tensor("op_4289_to_fp16"), val = tensor(0x1p-1)]; tensor var_4290_cast_fp16 = mul(x = linear_164_cast_fp16, y = var_4289_to_fp16)[name = tensor("op_4290_cast_fp16")]; tensor input_973_cast_fp16 = add(x = input_961_cast_fp16, y = var_4290_cast_fp16)[name = tensor("input_973_cast_fp16")]; tensor key_37_axes_0 = const()[name = tensor("key_37_axes_0"), val = tensor([-1])]; tensor encoder_layers_18_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_18_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(367311232)))]; tensor encoder_layers_18_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_18_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(367313344)))]; tensor key_37_cast_fp16 = layer_norm(axes = key_37_axes_0, beta = encoder_layers_18_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_18_norm_self_att_weight_to_fp16, x = input_973_cast_fp16)[name = tensor("key_37_cast_fp16")]; tensor input_975_interleave_0 = const()[name = tensor("input_975_interleave_0"), val = tensor(false)]; tensor input_975_cast_fp16 = concat(axis = var_68, interleave = input_975_interleave_0, values = (cache_73_cast_fp16, key_37_cast_fp16))[name = tensor("input_975_cast_fp16")]; tensor var_4312_begin_0 = const()[name = tensor("op_4312_begin_0"), val = tensor([0, 7, 0])]; tensor var_4312_end_0 = const()[name = tensor("op_4312_end_0"), val = tensor([1, 42, 1024])]; tensor var_4312_end_mask_0 = const()[name = tensor("op_4312_end_mask_0"), val = tensor([true, true, true])]; tensor var_4312_cast_fp16 = slice_by_index(begin = var_4312_begin_0, end = var_4312_end_0, end_mask = var_4312_end_mask_0, x = cache_73_cast_fp16)[name = tensor("op_4312_cast_fp16")]; tensor var_4318_interleave_0 = const()[name = tensor("op_4318_interleave_0"), val = tensor(false)]; tensor var_4318_cast_fp16 = concat(axis = var_68, interleave = var_4318_interleave_0, values = (var_4312_cast_fp16, key_37_cast_fp16))[name = tensor("op_4318_cast_fp16")]; tensor encoder_layers_18_self_attn_linear_q_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(367315456))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368101952))), name = tensor("encoder_layers_18_self_attn_linear_q_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_18_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368102144)))]; tensor linear_165_cast_fp16 = linear(bias = encoder_layers_18_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_18_self_attn_linear_q_weight_to_fp16_palettized, x = key_37_cast_fp16)[name = tensor("linear_165_cast_fp16")]; tensor var_4323 = const()[name = tensor("op_4323"), val = tensor([1, -1, 8, 128])]; tensor q_109_cast_fp16 = reshape(shape = var_4323, x = linear_165_cast_fp16)[name = tensor("q_109_cast_fp16")]; tensor encoder_layers_18_self_attn_linear_k_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368104256))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368890752))), name = tensor("encoder_layers_18_self_attn_linear_k_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_18_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368890944)))]; tensor linear_166_cast_fp16 = linear(bias = encoder_layers_18_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_18_self_attn_linear_k_weight_to_fp16_palettized, x = input_975_cast_fp16)[name = tensor("linear_166_cast_fp16")]; tensor var_4328 = const()[name = tensor("op_4328"), val = tensor([1, -1, 8, 128])]; tensor k_73_cast_fp16 = reshape(shape = var_4328, x = linear_166_cast_fp16)[name = tensor("k_73_cast_fp16")]; tensor encoder_layers_18_self_attn_linear_v_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368893056))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369679552))), name = tensor("encoder_layers_18_self_attn_linear_v_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor encoder_layers_18_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369679744)))]; tensor linear_167_cast_fp16 = linear(bias = encoder_layers_18_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_18_self_attn_linear_v_weight_to_fp16_palettized, x = input_975_cast_fp16)[name = tensor("linear_167_cast_fp16")]; tensor var_4333 = const()[name = tensor("op_4333"), val = tensor([1, -1, 8, 128])]; tensor v_37_cast_fp16 = reshape(shape = var_4333, x = linear_167_cast_fp16)[name = tensor("v_37_cast_fp16")]; tensor value_45_perm_0 = const()[name = tensor("value_45_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_18_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369681856)))]; tensor var_4346_cast_fp16 = add(x = q_109_cast_fp16, y = encoder_layers_18_self_attn_pos_bias_u_to_fp16)[name = tensor("op_4346_cast_fp16")]; tensor encoder_layers_18_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369683968)))]; tensor var_4348_cast_fp16 = add(x = q_109_cast_fp16, y = encoder_layers_18_self_attn_pos_bias_v_to_fp16)[name = tensor("op_4348_cast_fp16")]; tensor q_with_bias_v_37_perm_0 = const()[name = tensor("q_with_bias_v_37_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_475_transpose_x_0 = const()[name = tensor("x_475_transpose_x_0"), val = tensor(false)]; tensor x_475_transpose_y_0 = const()[name = tensor("x_475_transpose_y_0"), val = tensor(false)]; tensor op_4350_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_4350_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369686080))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369785664))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369785472)))]; tensor q_with_bias_v_37_cast_fp16 = transpose(perm = q_with_bias_v_37_perm_0, x = var_4348_cast_fp16)[name = tensor("transpose_200")]; tensor x_475_cast_fp16 = matmul(transpose_x = x_475_transpose_x_0, transpose_y = x_475_transpose_y_0, x = q_with_bias_v_37_cast_fp16, y = op_4350_to_fp16_quantized)[name = tensor("x_475_cast_fp16")]; tensor x_477_pad_0 = const()[name = tensor("x_477_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_477_mode_0 = const()[name = tensor("x_477_mode_0"), val = tensor("constant")]; tensor const_313_to_fp16 = const()[name = tensor("const_313_to_fp16"), val = tensor(0x0p+0)]; tensor x_477_cast_fp16 = pad(constant_val = const_313_to_fp16, mode = x_477_mode_0, pad = x_477_pad_0, x = x_475_cast_fp16)[name = tensor("x_477_cast_fp16")]; tensor var_4358 = const()[name = tensor("op_4358"), val = tensor([1, 8, -1, 7])]; tensor x_479_cast_fp16 = reshape(shape = var_4358, x = x_477_cast_fp16)[name = tensor("x_479_cast_fp16")]; tensor var_4362_begin_0 = const()[name = tensor("op_4362_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_4362_end_0 = const()[name = tensor("op_4362_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_4362_end_mask_0 = const()[name = tensor("op_4362_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_4362_cast_fp16 = slice_by_index(begin = var_4362_begin_0, end = var_4362_end_0, end_mask = var_4362_end_mask_0, x = x_479_cast_fp16)[name = tensor("op_4362_cast_fp16")]; tensor var_4363 = const()[name = tensor("op_4363"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_73_cast_fp16 = reshape(shape = var_4363, x = var_4362_cast_fp16)[name = tensor("matrix_bd_73_cast_fp16")]; tensor matrix_ac_37_transpose_x_0 = const()[name = tensor("matrix_ac_37_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_37_transpose_y_0 = const()[name = tensor("matrix_ac_37_transpose_y_0"), val = tensor(false)]; tensor transpose_132_perm_0 = const()[name = tensor("transpose_132_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_133_perm_0 = const()[name = tensor("transpose_133_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_133 = transpose(perm = transpose_133_perm_0, x = k_73_cast_fp16)[name = tensor("transpose_198")]; tensor transpose_132 = transpose(perm = transpose_132_perm_0, x = var_4346_cast_fp16)[name = tensor("transpose_199")]; tensor matrix_ac_37_cast_fp16 = matmul(transpose_x = matrix_ac_37_transpose_x_0, transpose_y = matrix_ac_37_transpose_y_0, x = transpose_132, y = transpose_133)[name = tensor("matrix_ac_37_cast_fp16")]; tensor matrix_bd_75_begin_0 = const()[name = tensor("matrix_bd_75_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_75_end_0 = const()[name = tensor("matrix_bd_75_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_75_end_mask_0 = const()[name = tensor("matrix_bd_75_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_75_cast_fp16 = slice_by_index(begin = matrix_bd_75_begin_0, end = matrix_bd_75_end_0, end_mask = matrix_bd_75_end_mask_0, x = matrix_bd_73_cast_fp16)[name = tensor("matrix_bd_75_cast_fp16")]; tensor var_4372_cast_fp16 = add(x = matrix_ac_37_cast_fp16, y = matrix_bd_75_cast_fp16)[name = tensor("op_4372_cast_fp16")]; tensor _inversed_scores_73_y_0_to_fp16 = const()[name = tensor("_inversed_scores_73_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_73_cast_fp16 = mul(x = var_4372_cast_fp16, y = _inversed_scores_73_y_0_to_fp16)[name = tensor("_inversed_scores_73_cast_fp16")]; tensor scores_75_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_73_cast_fp16, cond = mask_11)[name = tensor("scores_75_cast_fp16")]; tensor var_4378_cast_fp16 = softmax(axis = var_59, x = scores_75_cast_fp16)[name = tensor("op_4378_cast_fp16")]; tensor input_977_cast_fp16 = select(a = var_44_to_fp16, b = var_4378_cast_fp16, cond = mask_11)[name = tensor("input_977_cast_fp16")]; tensor x_481_transpose_x_0 = const()[name = tensor("x_481_transpose_x_0"), val = tensor(false)]; tensor x_481_transpose_y_0 = const()[name = tensor("x_481_transpose_y_0"), val = tensor(false)]; tensor value_45_cast_fp16 = transpose(perm = value_45_perm_0, x = v_37_cast_fp16)[name = tensor("transpose_197")]; tensor x_481_cast_fp16 = matmul(transpose_x = x_481_transpose_x_0, transpose_y = x_481_transpose_y_0, x = input_977_cast_fp16, y = value_45_cast_fp16)[name = tensor("x_481_cast_fp16")]; tensor var_4382_perm_0 = const()[name = tensor("op_4382_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4383 = const()[name = tensor("op_4383"), val = tensor([1, -1, 1024])]; tensor var_4382_cast_fp16 = transpose(perm = var_4382_perm_0, x = x_481_cast_fp16)[name = tensor("transpose_196")]; tensor input_979_cast_fp16 = reshape(shape = var_4383, x = var_4382_cast_fp16)[name = tensor("input_979_cast_fp16")]; tensor encoder_layers_18_self_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_18_self_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369785984))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370834624))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_18_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370836736)))]; tensor linear_169_cast_fp16 = linear(bias = encoder_layers_18_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_18_self_attn_linear_out_weight_to_fp16_quantized, x = input_979_cast_fp16)[name = tensor("linear_169_cast_fp16")]; tensor input_983_cast_fp16 = add(x = input_973_cast_fp16, y = linear_169_cast_fp16)[name = tensor("input_983_cast_fp16")]; tensor x_485_axes_0 = const()[name = tensor("x_485_axes_0"), val = tensor([-1])]; tensor encoder_layers_18_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_18_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370838848)))]; tensor encoder_layers_18_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_18_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370840960)))]; tensor x_485_cast_fp16 = layer_norm(axes = x_485_axes_0, beta = encoder_layers_18_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_18_norm_conv_weight_to_fp16, x = input_983_cast_fp16)[name = tensor("x_485_cast_fp16")]; tensor input_985_perm_0 = const()[name = tensor("input_985_perm_0"), val = tensor([0, 2, 1])]; tensor input_987_pad_type_0 = const()[name = tensor("input_987_pad_type_0"), val = tensor("valid")]; tensor input_987_strides_0 = const()[name = tensor("input_987_strides_0"), val = tensor([1])]; tensor input_987_pad_0 = const()[name = tensor("input_987_pad_0"), val = tensor([0, 0])]; tensor input_987_dilations_0 = const()[name = tensor("input_987_dilations_0"), val = tensor([1])]; tensor input_987_groups_0 = const()[name = tensor("input_987_groups_0"), val = tensor(1)]; tensor encoder_layers_18_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_18_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370843072))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(372940288))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_985_cast_fp16 = transpose(perm = input_985_perm_0, x = x_485_cast_fp16)[name = tensor("transpose_195")]; tensor input_987_cast_fp16 = conv(dilations = input_987_dilations_0, groups = input_987_groups_0, pad = input_987_pad_0, pad_type = input_987_pad_type_0, strides = input_987_strides_0, weight = encoder_layers_18_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_985_cast_fp16)[name = tensor("input_987_cast_fp16")]; tensor x_487_split_num_splits_0 = const()[name = tensor("x_487_split_num_splits_0"), val = tensor(2)]; tensor x_487_split_axis_0 = const()[name = tensor("x_487_split_axis_0"), val = tensor(1)]; tensor x_487_split_cast_fp16_0, tensor x_487_split_cast_fp16_1 = split(axis = x_487_split_axis_0, num_splits = x_487_split_num_splits_0, x = input_987_cast_fp16)[name = tensor("x_487_split_cast_fp16")]; tensor x_487_split_1_sigmoid_cast_fp16 = sigmoid(x = x_487_split_cast_fp16_1)[name = tensor("x_487_split_1_sigmoid_cast_fp16")]; tensor x_487_cast_fp16 = mul(x = x_487_split_cast_fp16_0, y = x_487_split_1_sigmoid_cast_fp16)[name = tensor("x_487_cast_fp16")]; tensor input_989_cast_fp16 = select(a = var_44_to_fp16, b = x_487_cast_fp16, cond = var_575)[name = tensor("input_989_cast_fp16")]; tensor new_x_75_interleave_0 = const()[name = tensor("new_x_75_interleave_0"), val = tensor(false)]; tensor new_x_75_cast_fp16 = concat(axis = var_59, interleave = new_x_75_interleave_0, values = (cache_75_cast_fp16, input_989_cast_fp16))[name = tensor("new_x_75_cast_fp16")]; tensor var_4422_begin_0 = const()[name = tensor("op_4422_begin_0"), val = tensor([0, 0, 7])]; tensor var_4422_end_0 = const()[name = tensor("op_4422_end_0"), val = tensor([1, 1024, 15])]; tensor var_4422_end_mask_0 = const()[name = tensor("op_4422_end_mask_0"), val = tensor([true, true, true])]; tensor var_4422_cast_fp16 = slice_by_index(begin = var_4422_begin_0, end = var_4422_end_0, end_mask = var_4422_end_mask_0, x = new_x_75_cast_fp16)[name = tensor("op_4422_cast_fp16")]; tensor x_489_pad_type_0 = const()[name = tensor("x_489_pad_type_0"), val = tensor("valid")]; tensor x_489_groups_0 = const()[name = tensor("x_489_groups_0"), val = tensor(1024)]; tensor x_489_strides_0 = const()[name = tensor("x_489_strides_0"), val = tensor([1])]; tensor x_489_pad_0 = const()[name = tensor("x_489_pad_0"), val = tensor([0, 0])]; tensor x_489_dilations_0 = const()[name = tensor("x_489_dilations_0"), val = tensor([1])]; tensor encoder_layers_18_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_18_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(372944448))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(372953728))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_489_cast_fp16 = conv(dilations = x_489_dilations_0, groups = x_489_groups_0, pad = x_489_pad_0, pad_type = x_489_pad_type_0, strides = x_489_strides_0, weight = encoder_layers_18_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_75_cast_fp16)[name = tensor("x_489_cast_fp16")]; tensor input_991_perm_0 = const()[name = tensor("input_991_perm_0"), val = tensor([0, 2, 1])]; tensor x_491_axes_0 = const()[name = tensor("x_491_axes_0"), val = tensor([-1])]; tensor encoder_layers_18_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_18_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(372955840)))]; tensor encoder_layers_18_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_18_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(372957952)))]; tensor input_991_cast_fp16 = transpose(perm = input_991_perm_0, x = x_489_cast_fp16)[name = tensor("transpose_194")]; tensor x_491_cast_fp16 = layer_norm(axes = x_491_axes_0, beta = encoder_layers_18_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_18_conv_batch_norm_weight_to_fp16, x = input_991_cast_fp16)[name = tensor("x_491_cast_fp16")]; tensor input_993_perm_0 = const()[name = tensor("input_993_perm_0"), val = tensor([0, 2, 1])]; tensor input_993_cast_fp16 = transpose(perm = input_993_perm_0, x = x_491_cast_fp16)[name = tensor("transpose_193")]; tensor input_995_cast_fp16 = silu(x = input_993_cast_fp16)[name = tensor("input_995_cast_fp16")]; tensor x_493_pad_type_0 = const()[name = tensor("x_493_pad_type_0"), val = tensor("valid")]; tensor x_493_strides_0 = const()[name = tensor("x_493_strides_0"), val = tensor([1])]; tensor x_493_pad_0 = const()[name = tensor("x_493_pad_0"), val = tensor([0, 0])]; tensor x_493_dilations_0 = const()[name = tensor("x_493_dilations_0"), val = tensor([1])]; tensor x_493_groups_0 = const()[name = tensor("x_493_groups_0"), val = tensor(1)]; tensor encoder_layers_18_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_18_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(372960064))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(374008704))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_493_cast_fp16 = conv(dilations = x_493_dilations_0, groups = x_493_groups_0, pad = x_493_pad_0, pad_type = x_493_pad_type_0, strides = x_493_strides_0, weight = encoder_layers_18_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_995_cast_fp16)[name = tensor("x_493_cast_fp16")]; tensor input_997_perm_0 = const()[name = tensor("input_997_perm_0"), val = tensor([0, 2, 1])]; tensor input_997_cast_fp16 = transpose(perm = input_997_perm_0, x = x_493_cast_fp16)[name = tensor("transpose_192")]; tensor input_999_cast_fp16 = add(x = input_983_cast_fp16, y = input_997_cast_fp16)[name = tensor("input_999_cast_fp16")]; tensor input_1001_axes_0 = const()[name = tensor("input_1001_axes_0"), val = tensor([-1])]; tensor encoder_layers_18_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_18_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(374010816)))]; tensor encoder_layers_18_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_18_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(374012928)))]; tensor input_1001_cast_fp16 = layer_norm(axes = input_1001_axes_0, beta = encoder_layers_18_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_18_norm_feed_forward2_weight_to_fp16, x = input_999_cast_fp16)[name = tensor("input_1001_cast_fp16")]; tensor encoder_layers_18_feed_forward2_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_18_feed_forward2_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(374015040))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(378209408))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_18_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_18_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(378217664)))]; tensor linear_170_cast_fp16 = linear(bias = encoder_layers_18_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_18_feed_forward2_linear1_weight_to_fp16_quantized, x = input_1001_cast_fp16)[name = tensor("linear_170_cast_fp16")]; tensor input_1005_cast_fp16 = silu(x = linear_170_cast_fp16)[name = tensor("input_1005_cast_fp16")]; tensor encoder_layers_18_feed_forward2_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_18_feed_forward2_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(378225920))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382420288))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_18_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_18_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382422400)))]; tensor linear_171_cast_fp16 = linear(bias = encoder_layers_18_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_18_feed_forward2_linear2_weight_to_fp16_quantized, x = input_1005_cast_fp16)[name = tensor("linear_171_cast_fp16")]; tensor var_4465_to_fp16 = const()[name = tensor("op_4465_to_fp16"), val = tensor(0x1p-1)]; tensor var_4466_cast_fp16 = mul(x = linear_171_cast_fp16, y = var_4465_to_fp16)[name = tensor("op_4466_cast_fp16")]; tensor input_1011_cast_fp16 = add(x = input_999_cast_fp16, y = var_4466_cast_fp16)[name = tensor("input_1011_cast_fp16")]; tensor input_1013_axes_0 = const()[name = tensor("input_1013_axes_0"), val = tensor([-1])]; tensor encoder_layers_18_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_18_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382424512)))]; tensor encoder_layers_18_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_18_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382426624)))]; tensor input_1013_cast_fp16 = layer_norm(axes = input_1013_axes_0, beta = encoder_layers_18_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_18_norm_out_weight_to_fp16, x = input_1011_cast_fp16)[name = tensor("input_1013_cast_fp16")]; tensor cache_77_begin_0 = const()[name = tensor("cache_77_begin_0"), val = tensor([19, 0, 0, 0])]; tensor cache_77_end_0 = const()[name = tensor("cache_77_end_0"), val = tensor([20, 1, 42, 1024])]; tensor cache_77_end_mask_0 = const()[name = tensor("cache_77_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_77_squeeze_mask_0 = const()[name = tensor("cache_77_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_77_cast_fp16 = slice_by_index(begin = cache_77_begin_0, end = cache_77_end_0, end_mask = cache_77_end_mask_0, squeeze_mask = cache_77_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_77_cast_fp16")]; tensor cache_79_begin_0 = const()[name = tensor("cache_79_begin_0"), val = tensor([19, 0, 0, 0])]; tensor cache_79_end_0 = const()[name = tensor("cache_79_end_0"), val = tensor([20, 1, 1024, 8])]; tensor cache_79_end_mask_0 = const()[name = tensor("cache_79_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_79_squeeze_mask_0 = const()[name = tensor("cache_79_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_79_cast_fp16 = slice_by_index(begin = cache_79_begin_0, end = cache_79_end_0, end_mask = cache_79_end_mask_0, squeeze_mask = cache_79_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_79_cast_fp16")]; tensor input_1015_axes_0 = const()[name = tensor("input_1015_axes_0"), val = tensor([-1])]; tensor encoder_layers_19_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_19_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382428736)))]; tensor encoder_layers_19_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_19_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382430848)))]; tensor input_1015_cast_fp16 = layer_norm(axes = input_1015_axes_0, beta = encoder_layers_19_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_19_norm_feed_forward1_weight_to_fp16, x = input_1013_cast_fp16)[name = tensor("input_1015_cast_fp16")]; tensor encoder_layers_19_feed_forward1_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_feed_forward1_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382432960))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(386627328))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_19_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_19_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(386635584)))]; tensor linear_172_cast_fp16 = linear(bias = encoder_layers_19_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_19_feed_forward1_linear1_weight_to_fp16_quantized, x = input_1015_cast_fp16)[name = tensor("linear_172_cast_fp16")]; tensor input_1019_cast_fp16 = silu(x = linear_172_cast_fp16)[name = tensor("input_1019_cast_fp16")]; tensor encoder_layers_19_feed_forward1_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_feed_forward1_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(386643840))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390838208))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_19_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_19_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390840320)))]; tensor linear_173_cast_fp16 = linear(bias = encoder_layers_19_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_19_feed_forward1_linear2_weight_to_fp16_quantized, x = input_1019_cast_fp16)[name = tensor("linear_173_cast_fp16")]; tensor var_4502_to_fp16 = const()[name = tensor("op_4502_to_fp16"), val = tensor(0x1p-1)]; tensor var_4503_cast_fp16 = mul(x = linear_173_cast_fp16, y = var_4502_to_fp16)[name = tensor("op_4503_cast_fp16")]; tensor input_1025_cast_fp16 = add(x = input_1013_cast_fp16, y = var_4503_cast_fp16)[name = tensor("input_1025_cast_fp16")]; tensor key_39_axes_0 = const()[name = tensor("key_39_axes_0"), val = tensor([-1])]; tensor encoder_layers_19_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_19_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390842432)))]; tensor encoder_layers_19_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_19_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390844544)))]; tensor key_39_cast_fp16 = layer_norm(axes = key_39_axes_0, beta = encoder_layers_19_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_19_norm_self_att_weight_to_fp16, x = input_1025_cast_fp16)[name = tensor("key_39_cast_fp16")]; tensor input_1027_interleave_0 = const()[name = tensor("input_1027_interleave_0"), val = tensor(false)]; tensor input_1027_cast_fp16 = concat(axis = var_68, interleave = input_1027_interleave_0, values = (cache_77_cast_fp16, key_39_cast_fp16))[name = tensor("input_1027_cast_fp16")]; tensor var_4525_begin_0 = const()[name = tensor("op_4525_begin_0"), val = tensor([0, 7, 0])]; tensor var_4525_end_0 = const()[name = tensor("op_4525_end_0"), val = tensor([1, 42, 1024])]; tensor var_4525_end_mask_0 = const()[name = tensor("op_4525_end_mask_0"), val = tensor([true, true, true])]; tensor var_4525_cast_fp16 = slice_by_index(begin = var_4525_begin_0, end = var_4525_end_0, end_mask = var_4525_end_mask_0, x = cache_77_cast_fp16)[name = tensor("op_4525_cast_fp16")]; tensor var_4531_interleave_0 = const()[name = tensor("op_4531_interleave_0"), val = tensor(false)]; tensor var_4531_cast_fp16 = concat(axis = var_68, interleave = var_4531_interleave_0, values = (var_4525_cast_fp16, key_39_cast_fp16))[name = tensor("op_4531_cast_fp16")]; tensor encoder_layers_19_self_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_self_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390846656))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(391895296))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_19_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(391897408)))]; tensor linear_174_cast_fp16 = linear(bias = encoder_layers_19_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_19_self_attn_linear_q_weight_to_fp16_quantized, x = key_39_cast_fp16)[name = tensor("linear_174_cast_fp16")]; tensor var_4536 = const()[name = tensor("op_4536"), val = tensor([1, -1, 8, 128])]; tensor q_115_cast_fp16 = reshape(shape = var_4536, x = linear_174_cast_fp16)[name = tensor("q_115_cast_fp16")]; tensor encoder_layers_19_self_attn_linear_k_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_self_attn_linear_k_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(391899520))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(392948160))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_19_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(392950272)))]; tensor linear_175_cast_fp16 = linear(bias = encoder_layers_19_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_19_self_attn_linear_k_weight_to_fp16_quantized, x = input_1027_cast_fp16)[name = tensor("linear_175_cast_fp16")]; tensor var_4541 = const()[name = tensor("op_4541"), val = tensor([1, -1, 8, 128])]; tensor k_77_cast_fp16 = reshape(shape = var_4541, x = linear_175_cast_fp16)[name = tensor("k_77_cast_fp16")]; tensor encoder_layers_19_self_attn_linear_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_self_attn_linear_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(392952384))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394001024))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_19_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394003136)))]; tensor linear_176_cast_fp16 = linear(bias = encoder_layers_19_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_19_self_attn_linear_v_weight_to_fp16_quantized, x = input_1027_cast_fp16)[name = tensor("linear_176_cast_fp16")]; tensor var_4546 = const()[name = tensor("op_4546"), val = tensor([1, -1, 8, 128])]; tensor v_39_cast_fp16 = reshape(shape = var_4546, x = linear_176_cast_fp16)[name = tensor("v_39_cast_fp16")]; tensor value_47_perm_0 = const()[name = tensor("value_47_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_19_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394005248)))]; tensor var_4559_cast_fp16 = add(x = q_115_cast_fp16, y = encoder_layers_19_self_attn_pos_bias_u_to_fp16)[name = tensor("op_4559_cast_fp16")]; tensor encoder_layers_19_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394007360)))]; tensor var_4561_cast_fp16 = add(x = q_115_cast_fp16, y = encoder_layers_19_self_attn_pos_bias_v_to_fp16)[name = tensor("op_4561_cast_fp16")]; tensor q_with_bias_v_39_perm_0 = const()[name = tensor("q_with_bias_v_39_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_501_transpose_x_0 = const()[name = tensor("x_501_transpose_x_0"), val = tensor(false)]; tensor x_501_transpose_y_0 = const()[name = tensor("x_501_transpose_y_0"), val = tensor(false)]; tensor op_4563_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_4563_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394009472))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394109056))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394108864)))]; tensor q_with_bias_v_39_cast_fp16 = transpose(perm = q_with_bias_v_39_perm_0, x = var_4561_cast_fp16)[name = tensor("transpose_191")]; tensor x_501_cast_fp16 = matmul(transpose_x = x_501_transpose_x_0, transpose_y = x_501_transpose_y_0, x = q_with_bias_v_39_cast_fp16, y = op_4563_to_fp16_quantized)[name = tensor("x_501_cast_fp16")]; tensor x_503_pad_0 = const()[name = tensor("x_503_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_503_mode_0 = const()[name = tensor("x_503_mode_0"), val = tensor("constant")]; tensor const_326_to_fp16 = const()[name = tensor("const_326_to_fp16"), val = tensor(0x0p+0)]; tensor x_503_cast_fp16 = pad(constant_val = const_326_to_fp16, mode = x_503_mode_0, pad = x_503_pad_0, x = x_501_cast_fp16)[name = tensor("x_503_cast_fp16")]; tensor var_4571 = const()[name = tensor("op_4571"), val = tensor([1, 8, -1, 7])]; tensor x_505_cast_fp16 = reshape(shape = var_4571, x = x_503_cast_fp16)[name = tensor("x_505_cast_fp16")]; tensor var_4575_begin_0 = const()[name = tensor("op_4575_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_4575_end_0 = const()[name = tensor("op_4575_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_4575_end_mask_0 = const()[name = tensor("op_4575_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_4575_cast_fp16 = slice_by_index(begin = var_4575_begin_0, end = var_4575_end_0, end_mask = var_4575_end_mask_0, x = x_505_cast_fp16)[name = tensor("op_4575_cast_fp16")]; tensor var_4576 = const()[name = tensor("op_4576"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_77_cast_fp16 = reshape(shape = var_4576, x = var_4575_cast_fp16)[name = tensor("matrix_bd_77_cast_fp16")]; tensor matrix_ac_39_transpose_x_0 = const()[name = tensor("matrix_ac_39_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_39_transpose_y_0 = const()[name = tensor("matrix_ac_39_transpose_y_0"), val = tensor(false)]; tensor transpose_134_perm_0 = const()[name = tensor("transpose_134_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_135_perm_0 = const()[name = tensor("transpose_135_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_135 = transpose(perm = transpose_135_perm_0, x = k_77_cast_fp16)[name = tensor("transpose_189")]; tensor transpose_134 = transpose(perm = transpose_134_perm_0, x = var_4559_cast_fp16)[name = tensor("transpose_190")]; tensor matrix_ac_39_cast_fp16 = matmul(transpose_x = matrix_ac_39_transpose_x_0, transpose_y = matrix_ac_39_transpose_y_0, x = transpose_134, y = transpose_135)[name = tensor("matrix_ac_39_cast_fp16")]; tensor matrix_bd_79_begin_0 = const()[name = tensor("matrix_bd_79_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_79_end_0 = const()[name = tensor("matrix_bd_79_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_79_end_mask_0 = const()[name = tensor("matrix_bd_79_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_79_cast_fp16 = slice_by_index(begin = matrix_bd_79_begin_0, end = matrix_bd_79_end_0, end_mask = matrix_bd_79_end_mask_0, x = matrix_bd_77_cast_fp16)[name = tensor("matrix_bd_79_cast_fp16")]; tensor var_4585_cast_fp16 = add(x = matrix_ac_39_cast_fp16, y = matrix_bd_79_cast_fp16)[name = tensor("op_4585_cast_fp16")]; tensor _inversed_scores_77_y_0_to_fp16 = const()[name = tensor("_inversed_scores_77_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_77_cast_fp16 = mul(x = var_4585_cast_fp16, y = _inversed_scores_77_y_0_to_fp16)[name = tensor("_inversed_scores_77_cast_fp16")]; tensor scores_79_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_77_cast_fp16, cond = mask_11)[name = tensor("scores_79_cast_fp16")]; tensor var_4591_cast_fp16 = softmax(axis = var_59, x = scores_79_cast_fp16)[name = tensor("op_4591_cast_fp16")]; tensor input_1029_cast_fp16 = select(a = var_44_to_fp16, b = var_4591_cast_fp16, cond = mask_11)[name = tensor("input_1029_cast_fp16")]; tensor x_507_transpose_x_0 = const()[name = tensor("x_507_transpose_x_0"), val = tensor(false)]; tensor x_507_transpose_y_0 = const()[name = tensor("x_507_transpose_y_0"), val = tensor(false)]; tensor value_47_cast_fp16 = transpose(perm = value_47_perm_0, x = v_39_cast_fp16)[name = tensor("transpose_188")]; tensor x_507_cast_fp16 = matmul(transpose_x = x_507_transpose_x_0, transpose_y = x_507_transpose_y_0, x = input_1029_cast_fp16, y = value_47_cast_fp16)[name = tensor("x_507_cast_fp16")]; tensor var_4595_perm_0 = const()[name = tensor("op_4595_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4596 = const()[name = tensor("op_4596"), val = tensor([1, -1, 1024])]; tensor var_4595_cast_fp16 = transpose(perm = var_4595_perm_0, x = x_507_cast_fp16)[name = tensor("transpose_187")]; tensor input_1031_cast_fp16 = reshape(shape = var_4596, x = var_4595_cast_fp16)[name = tensor("input_1031_cast_fp16")]; tensor encoder_layers_19_self_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_self_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394109376))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(395158016))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_19_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(395160128)))]; tensor linear_178_cast_fp16 = linear(bias = encoder_layers_19_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_19_self_attn_linear_out_weight_to_fp16_quantized, x = input_1031_cast_fp16)[name = tensor("linear_178_cast_fp16")]; tensor input_1035_cast_fp16 = add(x = input_1025_cast_fp16, y = linear_178_cast_fp16)[name = tensor("input_1035_cast_fp16")]; tensor x_511_axes_0 = const()[name = tensor("x_511_axes_0"), val = tensor([-1])]; tensor encoder_layers_19_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_19_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(395162240)))]; tensor encoder_layers_19_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_19_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(395164352)))]; tensor x_511_cast_fp16 = layer_norm(axes = x_511_axes_0, beta = encoder_layers_19_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_19_norm_conv_weight_to_fp16, x = input_1035_cast_fp16)[name = tensor("x_511_cast_fp16")]; tensor input_1037_perm_0 = const()[name = tensor("input_1037_perm_0"), val = tensor([0, 2, 1])]; tensor input_1039_pad_type_0 = const()[name = tensor("input_1039_pad_type_0"), val = tensor("valid")]; tensor input_1039_strides_0 = const()[name = tensor("input_1039_strides_0"), val = tensor([1])]; tensor input_1039_pad_0 = const()[name = tensor("input_1039_pad_0"), val = tensor([0, 0])]; tensor input_1039_dilations_0 = const()[name = tensor("input_1039_dilations_0"), val = tensor([1])]; tensor input_1039_groups_0 = const()[name = tensor("input_1039_groups_0"), val = tensor(1)]; tensor encoder_layers_19_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(395166464))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(397263680))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_1037_cast_fp16 = transpose(perm = input_1037_perm_0, x = x_511_cast_fp16)[name = tensor("transpose_186")]; tensor input_1039_cast_fp16 = conv(dilations = input_1039_dilations_0, groups = input_1039_groups_0, pad = input_1039_pad_0, pad_type = input_1039_pad_type_0, strides = input_1039_strides_0, weight = encoder_layers_19_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_1037_cast_fp16)[name = tensor("input_1039_cast_fp16")]; tensor x_513_split_num_splits_0 = const()[name = tensor("x_513_split_num_splits_0"), val = tensor(2)]; tensor x_513_split_axis_0 = const()[name = tensor("x_513_split_axis_0"), val = tensor(1)]; tensor x_513_split_cast_fp16_0, tensor x_513_split_cast_fp16_1 = split(axis = x_513_split_axis_0, num_splits = x_513_split_num_splits_0, x = input_1039_cast_fp16)[name = tensor("x_513_split_cast_fp16")]; tensor x_513_split_1_sigmoid_cast_fp16 = sigmoid(x = x_513_split_cast_fp16_1)[name = tensor("x_513_split_1_sigmoid_cast_fp16")]; tensor x_513_cast_fp16 = mul(x = x_513_split_cast_fp16_0, y = x_513_split_1_sigmoid_cast_fp16)[name = tensor("x_513_cast_fp16")]; tensor input_1041_cast_fp16 = select(a = var_44_to_fp16, b = x_513_cast_fp16, cond = var_575)[name = tensor("input_1041_cast_fp16")]; tensor new_x_79_interleave_0 = const()[name = tensor("new_x_79_interleave_0"), val = tensor(false)]; tensor new_x_79_cast_fp16 = concat(axis = var_59, interleave = new_x_79_interleave_0, values = (cache_79_cast_fp16, input_1041_cast_fp16))[name = tensor("new_x_79_cast_fp16")]; tensor var_4635_begin_0 = const()[name = tensor("op_4635_begin_0"), val = tensor([0, 0, 7])]; tensor var_4635_end_0 = const()[name = tensor("op_4635_end_0"), val = tensor([1, 1024, 15])]; tensor var_4635_end_mask_0 = const()[name = tensor("op_4635_end_mask_0"), val = tensor([true, true, true])]; tensor var_4635_cast_fp16 = slice_by_index(begin = var_4635_begin_0, end = var_4635_end_0, end_mask = var_4635_end_mask_0, x = new_x_79_cast_fp16)[name = tensor("op_4635_cast_fp16")]; tensor x_515_pad_type_0 = const()[name = tensor("x_515_pad_type_0"), val = tensor("valid")]; tensor x_515_groups_0 = const()[name = tensor("x_515_groups_0"), val = tensor(1024)]; tensor x_515_strides_0 = const()[name = tensor("x_515_strides_0"), val = tensor([1])]; tensor x_515_pad_0 = const()[name = tensor("x_515_pad_0"), val = tensor([0, 0])]; tensor x_515_dilations_0 = const()[name = tensor("x_515_dilations_0"), val = tensor([1])]; tensor encoder_layers_19_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(397267840))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(397277120))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_515_cast_fp16 = conv(dilations = x_515_dilations_0, groups = x_515_groups_0, pad = x_515_pad_0, pad_type = x_515_pad_type_0, strides = x_515_strides_0, weight = encoder_layers_19_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_79_cast_fp16)[name = tensor("x_515_cast_fp16")]; tensor input_1043_perm_0 = const()[name = tensor("input_1043_perm_0"), val = tensor([0, 2, 1])]; tensor x_517_axes_0 = const()[name = tensor("x_517_axes_0"), val = tensor([-1])]; tensor encoder_layers_19_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_19_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(397279232)))]; tensor encoder_layers_19_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_19_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(397281344)))]; tensor input_1043_cast_fp16 = transpose(perm = input_1043_perm_0, x = x_515_cast_fp16)[name = tensor("transpose_185")]; tensor x_517_cast_fp16 = layer_norm(axes = x_517_axes_0, beta = encoder_layers_19_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_19_conv_batch_norm_weight_to_fp16, x = input_1043_cast_fp16)[name = tensor("x_517_cast_fp16")]; tensor input_1045_perm_0 = const()[name = tensor("input_1045_perm_0"), val = tensor([0, 2, 1])]; tensor input_1045_cast_fp16 = transpose(perm = input_1045_perm_0, x = x_517_cast_fp16)[name = tensor("transpose_184")]; tensor input_1047_cast_fp16 = silu(x = input_1045_cast_fp16)[name = tensor("input_1047_cast_fp16")]; tensor x_519_pad_type_0 = const()[name = tensor("x_519_pad_type_0"), val = tensor("valid")]; tensor x_519_strides_0 = const()[name = tensor("x_519_strides_0"), val = tensor([1])]; tensor x_519_pad_0 = const()[name = tensor("x_519_pad_0"), val = tensor([0, 0])]; tensor x_519_dilations_0 = const()[name = tensor("x_519_dilations_0"), val = tensor([1])]; tensor x_519_groups_0 = const()[name = tensor("x_519_groups_0"), val = tensor(1)]; tensor encoder_layers_19_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(397283456))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(398332096))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_519_cast_fp16 = conv(dilations = x_519_dilations_0, groups = x_519_groups_0, pad = x_519_pad_0, pad_type = x_519_pad_type_0, strides = x_519_strides_0, weight = encoder_layers_19_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_1047_cast_fp16)[name = tensor("x_519_cast_fp16")]; tensor input_1049_perm_0 = const()[name = tensor("input_1049_perm_0"), val = tensor([0, 2, 1])]; tensor input_1049_cast_fp16 = transpose(perm = input_1049_perm_0, x = x_519_cast_fp16)[name = tensor("transpose_183")]; tensor input_1051_cast_fp16 = add(x = input_1035_cast_fp16, y = input_1049_cast_fp16)[name = tensor("input_1051_cast_fp16")]; tensor input_1053_axes_0 = const()[name = tensor("input_1053_axes_0"), val = tensor([-1])]; tensor encoder_layers_19_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_19_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(398334208)))]; tensor encoder_layers_19_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_19_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(398336320)))]; tensor input_1053_cast_fp16 = layer_norm(axes = input_1053_axes_0, beta = encoder_layers_19_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_19_norm_feed_forward2_weight_to_fp16, x = input_1051_cast_fp16)[name = tensor("input_1053_cast_fp16")]; tensor encoder_layers_19_feed_forward2_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_feed_forward2_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(398338432))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(402532800))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_19_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_19_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(402541056)))]; tensor linear_179_cast_fp16 = linear(bias = encoder_layers_19_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_19_feed_forward2_linear1_weight_to_fp16_quantized, x = input_1053_cast_fp16)[name = tensor("linear_179_cast_fp16")]; tensor input_1057_cast_fp16 = silu(x = linear_179_cast_fp16)[name = tensor("input_1057_cast_fp16")]; tensor encoder_layers_19_feed_forward2_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_19_feed_forward2_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(402549312))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406743680))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_19_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_19_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406745792)))]; tensor linear_180_cast_fp16 = linear(bias = encoder_layers_19_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_19_feed_forward2_linear2_weight_to_fp16_quantized, x = input_1057_cast_fp16)[name = tensor("linear_180_cast_fp16")]; tensor var_4678_to_fp16 = const()[name = tensor("op_4678_to_fp16"), val = tensor(0x1p-1)]; tensor var_4679_cast_fp16 = mul(x = linear_180_cast_fp16, y = var_4678_to_fp16)[name = tensor("op_4679_cast_fp16")]; tensor input_1063_cast_fp16 = add(x = input_1051_cast_fp16, y = var_4679_cast_fp16)[name = tensor("input_1063_cast_fp16")]; tensor input_1065_axes_0 = const()[name = tensor("input_1065_axes_0"), val = tensor([-1])]; tensor encoder_layers_19_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_19_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406747904)))]; tensor encoder_layers_19_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_19_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406750016)))]; tensor input_1065_cast_fp16 = layer_norm(axes = input_1065_axes_0, beta = encoder_layers_19_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_19_norm_out_weight_to_fp16, x = input_1063_cast_fp16)[name = tensor("input_1065_cast_fp16")]; tensor cache_81_begin_0 = const()[name = tensor("cache_81_begin_0"), val = tensor([20, 0, 0, 0])]; tensor cache_81_end_0 = const()[name = tensor("cache_81_end_0"), val = tensor([21, 1, 42, 1024])]; tensor cache_81_end_mask_0 = const()[name = tensor("cache_81_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_81_squeeze_mask_0 = const()[name = tensor("cache_81_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_81_cast_fp16 = slice_by_index(begin = cache_81_begin_0, end = cache_81_end_0, end_mask = cache_81_end_mask_0, squeeze_mask = cache_81_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_81_cast_fp16")]; tensor cache_83_begin_0 = const()[name = tensor("cache_83_begin_0"), val = tensor([20, 0, 0, 0])]; tensor cache_83_end_0 = const()[name = tensor("cache_83_end_0"), val = tensor([21, 1, 1024, 8])]; tensor cache_83_end_mask_0 = const()[name = tensor("cache_83_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_83_squeeze_mask_0 = const()[name = tensor("cache_83_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_83_cast_fp16 = slice_by_index(begin = cache_83_begin_0, end = cache_83_end_0, end_mask = cache_83_end_mask_0, squeeze_mask = cache_83_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_83_cast_fp16")]; tensor input_1067_axes_0 = const()[name = tensor("input_1067_axes_0"), val = tensor([-1])]; tensor encoder_layers_20_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_20_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406752128)))]; tensor encoder_layers_20_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_20_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406754240)))]; tensor input_1067_cast_fp16 = layer_norm(axes = input_1067_axes_0, beta = encoder_layers_20_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_20_norm_feed_forward1_weight_to_fp16, x = input_1065_cast_fp16)[name = tensor("input_1067_cast_fp16")]; tensor encoder_layers_20_feed_forward1_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_feed_forward1_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406756352))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(410950720))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_20_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_20_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(410958976)))]; tensor linear_181_cast_fp16 = linear(bias = encoder_layers_20_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_20_feed_forward1_linear1_weight_to_fp16_quantized, x = input_1067_cast_fp16)[name = tensor("linear_181_cast_fp16")]; tensor input_1071_cast_fp16 = silu(x = linear_181_cast_fp16)[name = tensor("input_1071_cast_fp16")]; tensor encoder_layers_20_feed_forward1_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_feed_forward1_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(410967232))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415161600))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_20_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_20_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415163712)))]; tensor linear_182_cast_fp16 = linear(bias = encoder_layers_20_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_20_feed_forward1_linear2_weight_to_fp16_quantized, x = input_1071_cast_fp16)[name = tensor("linear_182_cast_fp16")]; tensor var_4715_to_fp16 = const()[name = tensor("op_4715_to_fp16"), val = tensor(0x1p-1)]; tensor var_4716_cast_fp16 = mul(x = linear_182_cast_fp16, y = var_4715_to_fp16)[name = tensor("op_4716_cast_fp16")]; tensor input_1077_cast_fp16 = add(x = input_1065_cast_fp16, y = var_4716_cast_fp16)[name = tensor("input_1077_cast_fp16")]; tensor key_41_axes_0 = const()[name = tensor("key_41_axes_0"), val = tensor([-1])]; tensor encoder_layers_20_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_20_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415165824)))]; tensor encoder_layers_20_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_20_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415167936)))]; tensor key_41_cast_fp16 = layer_norm(axes = key_41_axes_0, beta = encoder_layers_20_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_20_norm_self_att_weight_to_fp16, x = input_1077_cast_fp16)[name = tensor("key_41_cast_fp16")]; tensor input_1079_interleave_0 = const()[name = tensor("input_1079_interleave_0"), val = tensor(false)]; tensor input_1079_cast_fp16 = concat(axis = var_68, interleave = input_1079_interleave_0, values = (cache_81_cast_fp16, key_41_cast_fp16))[name = tensor("input_1079_cast_fp16")]; tensor var_4738_begin_0 = const()[name = tensor("op_4738_begin_0"), val = tensor([0, 7, 0])]; tensor var_4738_end_0 = const()[name = tensor("op_4738_end_0"), val = tensor([1, 42, 1024])]; tensor var_4738_end_mask_0 = const()[name = tensor("op_4738_end_mask_0"), val = tensor([true, true, true])]; tensor var_4738_cast_fp16 = slice_by_index(begin = var_4738_begin_0, end = var_4738_end_0, end_mask = var_4738_end_mask_0, x = cache_81_cast_fp16)[name = tensor("op_4738_cast_fp16")]; tensor var_4744_interleave_0 = const()[name = tensor("op_4744_interleave_0"), val = tensor(false)]; tensor var_4744_cast_fp16 = concat(axis = var_68, interleave = var_4744_interleave_0, values = (var_4738_cast_fp16, key_41_cast_fp16))[name = tensor("op_4744_cast_fp16")]; tensor encoder_layers_20_self_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_self_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415170048))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416218688))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_20_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416220800)))]; tensor linear_183_cast_fp16 = linear(bias = encoder_layers_20_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_20_self_attn_linear_q_weight_to_fp16_quantized, x = key_41_cast_fp16)[name = tensor("linear_183_cast_fp16")]; tensor var_4749 = const()[name = tensor("op_4749"), val = tensor([1, -1, 8, 128])]; tensor q_121_cast_fp16 = reshape(shape = var_4749, x = linear_183_cast_fp16)[name = tensor("q_121_cast_fp16")]; tensor encoder_layers_20_self_attn_linear_k_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_self_attn_linear_k_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416222912))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(417271552))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_20_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(417273664)))]; tensor linear_184_cast_fp16 = linear(bias = encoder_layers_20_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_20_self_attn_linear_k_weight_to_fp16_quantized, x = input_1079_cast_fp16)[name = tensor("linear_184_cast_fp16")]; tensor var_4754 = const()[name = tensor("op_4754"), val = tensor([1, -1, 8, 128])]; tensor k_81_cast_fp16 = reshape(shape = var_4754, x = linear_184_cast_fp16)[name = tensor("k_81_cast_fp16")]; tensor encoder_layers_20_self_attn_linear_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_self_attn_linear_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(417275776))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418324416))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_20_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418326528)))]; tensor linear_185_cast_fp16 = linear(bias = encoder_layers_20_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_20_self_attn_linear_v_weight_to_fp16_quantized, x = input_1079_cast_fp16)[name = tensor("linear_185_cast_fp16")]; tensor var_4759 = const()[name = tensor("op_4759"), val = tensor([1, -1, 8, 128])]; tensor v_41_cast_fp16 = reshape(shape = var_4759, x = linear_185_cast_fp16)[name = tensor("v_41_cast_fp16")]; tensor value_49_perm_0 = const()[name = tensor("value_49_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_20_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418328640)))]; tensor var_4772_cast_fp16 = add(x = q_121_cast_fp16, y = encoder_layers_20_self_attn_pos_bias_u_to_fp16)[name = tensor("op_4772_cast_fp16")]; tensor encoder_layers_20_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418330752)))]; tensor var_4774_cast_fp16 = add(x = q_121_cast_fp16, y = encoder_layers_20_self_attn_pos_bias_v_to_fp16)[name = tensor("op_4774_cast_fp16")]; tensor q_with_bias_v_41_perm_0 = const()[name = tensor("q_with_bias_v_41_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_527_transpose_x_0 = const()[name = tensor("x_527_transpose_x_0"), val = tensor(false)]; tensor x_527_transpose_y_0 = const()[name = tensor("x_527_transpose_y_0"), val = tensor(false)]; tensor op_4776_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_4776_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418332864))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418432448))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418432256)))]; tensor q_with_bias_v_41_cast_fp16 = transpose(perm = q_with_bias_v_41_perm_0, x = var_4774_cast_fp16)[name = tensor("transpose_182")]; tensor x_527_cast_fp16 = matmul(transpose_x = x_527_transpose_x_0, transpose_y = x_527_transpose_y_0, x = q_with_bias_v_41_cast_fp16, y = op_4776_to_fp16_quantized)[name = tensor("x_527_cast_fp16")]; tensor x_529_pad_0 = const()[name = tensor("x_529_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_529_mode_0 = const()[name = tensor("x_529_mode_0"), val = tensor("constant")]; tensor const_339_to_fp16 = const()[name = tensor("const_339_to_fp16"), val = tensor(0x0p+0)]; tensor x_529_cast_fp16 = pad(constant_val = const_339_to_fp16, mode = x_529_mode_0, pad = x_529_pad_0, x = x_527_cast_fp16)[name = tensor("x_529_cast_fp16")]; tensor var_4784 = const()[name = tensor("op_4784"), val = tensor([1, 8, -1, 7])]; tensor x_531_cast_fp16 = reshape(shape = var_4784, x = x_529_cast_fp16)[name = tensor("x_531_cast_fp16")]; tensor var_4788_begin_0 = const()[name = tensor("op_4788_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_4788_end_0 = const()[name = tensor("op_4788_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_4788_end_mask_0 = const()[name = tensor("op_4788_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_4788_cast_fp16 = slice_by_index(begin = var_4788_begin_0, end = var_4788_end_0, end_mask = var_4788_end_mask_0, x = x_531_cast_fp16)[name = tensor("op_4788_cast_fp16")]; tensor var_4789 = const()[name = tensor("op_4789"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_81_cast_fp16 = reshape(shape = var_4789, x = var_4788_cast_fp16)[name = tensor("matrix_bd_81_cast_fp16")]; tensor matrix_ac_41_transpose_x_0 = const()[name = tensor("matrix_ac_41_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_41_transpose_y_0 = const()[name = tensor("matrix_ac_41_transpose_y_0"), val = tensor(false)]; tensor transpose_136_perm_0 = const()[name = tensor("transpose_136_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_137_perm_0 = const()[name = tensor("transpose_137_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_137 = transpose(perm = transpose_137_perm_0, x = k_81_cast_fp16)[name = tensor("transpose_180")]; tensor transpose_136 = transpose(perm = transpose_136_perm_0, x = var_4772_cast_fp16)[name = tensor("transpose_181")]; tensor matrix_ac_41_cast_fp16 = matmul(transpose_x = matrix_ac_41_transpose_x_0, transpose_y = matrix_ac_41_transpose_y_0, x = transpose_136, y = transpose_137)[name = tensor("matrix_ac_41_cast_fp16")]; tensor matrix_bd_83_begin_0 = const()[name = tensor("matrix_bd_83_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_83_end_0 = const()[name = tensor("matrix_bd_83_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_83_end_mask_0 = const()[name = tensor("matrix_bd_83_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_83_cast_fp16 = slice_by_index(begin = matrix_bd_83_begin_0, end = matrix_bd_83_end_0, end_mask = matrix_bd_83_end_mask_0, x = matrix_bd_81_cast_fp16)[name = tensor("matrix_bd_83_cast_fp16")]; tensor var_4798_cast_fp16 = add(x = matrix_ac_41_cast_fp16, y = matrix_bd_83_cast_fp16)[name = tensor("op_4798_cast_fp16")]; tensor _inversed_scores_81_y_0_to_fp16 = const()[name = tensor("_inversed_scores_81_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_81_cast_fp16 = mul(x = var_4798_cast_fp16, y = _inversed_scores_81_y_0_to_fp16)[name = tensor("_inversed_scores_81_cast_fp16")]; tensor scores_83_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_81_cast_fp16, cond = mask_11)[name = tensor("scores_83_cast_fp16")]; tensor var_4804_cast_fp16 = softmax(axis = var_59, x = scores_83_cast_fp16)[name = tensor("op_4804_cast_fp16")]; tensor input_1081_cast_fp16 = select(a = var_44_to_fp16, b = var_4804_cast_fp16, cond = mask_11)[name = tensor("input_1081_cast_fp16")]; tensor x_533_transpose_x_0 = const()[name = tensor("x_533_transpose_x_0"), val = tensor(false)]; tensor x_533_transpose_y_0 = const()[name = tensor("x_533_transpose_y_0"), val = tensor(false)]; tensor value_49_cast_fp16 = transpose(perm = value_49_perm_0, x = v_41_cast_fp16)[name = tensor("transpose_179")]; tensor x_533_cast_fp16 = matmul(transpose_x = x_533_transpose_x_0, transpose_y = x_533_transpose_y_0, x = input_1081_cast_fp16, y = value_49_cast_fp16)[name = tensor("x_533_cast_fp16")]; tensor var_4808_perm_0 = const()[name = tensor("op_4808_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_4809 = const()[name = tensor("op_4809"), val = tensor([1, -1, 1024])]; tensor var_4808_cast_fp16 = transpose(perm = var_4808_perm_0, x = x_533_cast_fp16)[name = tensor("transpose_178")]; tensor input_1083_cast_fp16 = reshape(shape = var_4809, x = var_4808_cast_fp16)[name = tensor("input_1083_cast_fp16")]; tensor encoder_layers_20_self_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_self_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418432768))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419481408))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_20_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419483520)))]; tensor linear_187_cast_fp16 = linear(bias = encoder_layers_20_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_20_self_attn_linear_out_weight_to_fp16_quantized, x = input_1083_cast_fp16)[name = tensor("linear_187_cast_fp16")]; tensor input_1087_cast_fp16 = add(x = input_1077_cast_fp16, y = linear_187_cast_fp16)[name = tensor("input_1087_cast_fp16")]; tensor x_537_axes_0 = const()[name = tensor("x_537_axes_0"), val = tensor([-1])]; tensor encoder_layers_20_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_20_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419485632)))]; tensor encoder_layers_20_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_20_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419487744)))]; tensor x_537_cast_fp16 = layer_norm(axes = x_537_axes_0, beta = encoder_layers_20_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_20_norm_conv_weight_to_fp16, x = input_1087_cast_fp16)[name = tensor("x_537_cast_fp16")]; tensor input_1089_perm_0 = const()[name = tensor("input_1089_perm_0"), val = tensor([0, 2, 1])]; tensor input_1091_pad_type_0 = const()[name = tensor("input_1091_pad_type_0"), val = tensor("valid")]; tensor input_1091_strides_0 = const()[name = tensor("input_1091_strides_0"), val = tensor([1])]; tensor input_1091_pad_0 = const()[name = tensor("input_1091_pad_0"), val = tensor([0, 0])]; tensor input_1091_dilations_0 = const()[name = tensor("input_1091_dilations_0"), val = tensor([1])]; tensor input_1091_groups_0 = const()[name = tensor("input_1091_groups_0"), val = tensor(1)]; tensor encoder_layers_20_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419489856))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421587072))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_1089_cast_fp16 = transpose(perm = input_1089_perm_0, x = x_537_cast_fp16)[name = tensor("transpose_177")]; tensor input_1091_cast_fp16 = conv(dilations = input_1091_dilations_0, groups = input_1091_groups_0, pad = input_1091_pad_0, pad_type = input_1091_pad_type_0, strides = input_1091_strides_0, weight = encoder_layers_20_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_1089_cast_fp16)[name = tensor("input_1091_cast_fp16")]; tensor x_539_split_num_splits_0 = const()[name = tensor("x_539_split_num_splits_0"), val = tensor(2)]; tensor x_539_split_axis_0 = const()[name = tensor("x_539_split_axis_0"), val = tensor(1)]; tensor x_539_split_cast_fp16_0, tensor x_539_split_cast_fp16_1 = split(axis = x_539_split_axis_0, num_splits = x_539_split_num_splits_0, x = input_1091_cast_fp16)[name = tensor("x_539_split_cast_fp16")]; tensor x_539_split_1_sigmoid_cast_fp16 = sigmoid(x = x_539_split_cast_fp16_1)[name = tensor("x_539_split_1_sigmoid_cast_fp16")]; tensor x_539_cast_fp16 = mul(x = x_539_split_cast_fp16_0, y = x_539_split_1_sigmoid_cast_fp16)[name = tensor("x_539_cast_fp16")]; tensor input_1093_cast_fp16 = select(a = var_44_to_fp16, b = x_539_cast_fp16, cond = var_575)[name = tensor("input_1093_cast_fp16")]; tensor new_x_83_interleave_0 = const()[name = tensor("new_x_83_interleave_0"), val = tensor(false)]; tensor new_x_83_cast_fp16 = concat(axis = var_59, interleave = new_x_83_interleave_0, values = (cache_83_cast_fp16, input_1093_cast_fp16))[name = tensor("new_x_83_cast_fp16")]; tensor var_4848_begin_0 = const()[name = tensor("op_4848_begin_0"), val = tensor([0, 0, 7])]; tensor var_4848_end_0 = const()[name = tensor("op_4848_end_0"), val = tensor([1, 1024, 15])]; tensor var_4848_end_mask_0 = const()[name = tensor("op_4848_end_mask_0"), val = tensor([true, true, true])]; tensor var_4848_cast_fp16 = slice_by_index(begin = var_4848_begin_0, end = var_4848_end_0, end_mask = var_4848_end_mask_0, x = new_x_83_cast_fp16)[name = tensor("op_4848_cast_fp16")]; tensor x_541_pad_type_0 = const()[name = tensor("x_541_pad_type_0"), val = tensor("valid")]; tensor x_541_groups_0 = const()[name = tensor("x_541_groups_0"), val = tensor(1024)]; tensor x_541_strides_0 = const()[name = tensor("x_541_strides_0"), val = tensor([1])]; tensor x_541_pad_0 = const()[name = tensor("x_541_pad_0"), val = tensor([0, 0])]; tensor x_541_dilations_0 = const()[name = tensor("x_541_dilations_0"), val = tensor([1])]; tensor encoder_layers_20_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421591232))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421600512))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_541_cast_fp16 = conv(dilations = x_541_dilations_0, groups = x_541_groups_0, pad = x_541_pad_0, pad_type = x_541_pad_type_0, strides = x_541_strides_0, weight = encoder_layers_20_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_83_cast_fp16)[name = tensor("x_541_cast_fp16")]; tensor input_1095_perm_0 = const()[name = tensor("input_1095_perm_0"), val = tensor([0, 2, 1])]; tensor x_543_axes_0 = const()[name = tensor("x_543_axes_0"), val = tensor([-1])]; tensor encoder_layers_20_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_20_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421602624)))]; tensor encoder_layers_20_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_20_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421604736)))]; tensor input_1095_cast_fp16 = transpose(perm = input_1095_perm_0, x = x_541_cast_fp16)[name = tensor("transpose_176")]; tensor x_543_cast_fp16 = layer_norm(axes = x_543_axes_0, beta = encoder_layers_20_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_20_conv_batch_norm_weight_to_fp16, x = input_1095_cast_fp16)[name = tensor("x_543_cast_fp16")]; tensor input_1097_perm_0 = const()[name = tensor("input_1097_perm_0"), val = tensor([0, 2, 1])]; tensor input_1097_cast_fp16 = transpose(perm = input_1097_perm_0, x = x_543_cast_fp16)[name = tensor("transpose_175")]; tensor input_1099_cast_fp16 = silu(x = input_1097_cast_fp16)[name = tensor("input_1099_cast_fp16")]; tensor x_545_pad_type_0 = const()[name = tensor("x_545_pad_type_0"), val = tensor("valid")]; tensor x_545_strides_0 = const()[name = tensor("x_545_strides_0"), val = tensor([1])]; tensor x_545_pad_0 = const()[name = tensor("x_545_pad_0"), val = tensor([0, 0])]; tensor x_545_dilations_0 = const()[name = tensor("x_545_dilations_0"), val = tensor([1])]; tensor x_545_groups_0 = const()[name = tensor("x_545_groups_0"), val = tensor(1)]; tensor encoder_layers_20_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421606848))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(422655488))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_545_cast_fp16 = conv(dilations = x_545_dilations_0, groups = x_545_groups_0, pad = x_545_pad_0, pad_type = x_545_pad_type_0, strides = x_545_strides_0, weight = encoder_layers_20_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_1099_cast_fp16)[name = tensor("x_545_cast_fp16")]; tensor input_1101_perm_0 = const()[name = tensor("input_1101_perm_0"), val = tensor([0, 2, 1])]; tensor input_1101_cast_fp16 = transpose(perm = input_1101_perm_0, x = x_545_cast_fp16)[name = tensor("transpose_174")]; tensor input_1103_cast_fp16 = add(x = input_1087_cast_fp16, y = input_1101_cast_fp16)[name = tensor("input_1103_cast_fp16")]; tensor input_1105_axes_0 = const()[name = tensor("input_1105_axes_0"), val = tensor([-1])]; tensor encoder_layers_20_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_20_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(422657600)))]; tensor encoder_layers_20_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_20_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(422659712)))]; tensor input_1105_cast_fp16 = layer_norm(axes = input_1105_axes_0, beta = encoder_layers_20_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_20_norm_feed_forward2_weight_to_fp16, x = input_1103_cast_fp16)[name = tensor("input_1105_cast_fp16")]; tensor encoder_layers_20_feed_forward2_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_feed_forward2_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(422661824))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(426856192))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_20_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_20_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(426864448)))]; tensor linear_188_cast_fp16 = linear(bias = encoder_layers_20_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_20_feed_forward2_linear1_weight_to_fp16_quantized, x = input_1105_cast_fp16)[name = tensor("linear_188_cast_fp16")]; tensor input_1109_cast_fp16 = silu(x = linear_188_cast_fp16)[name = tensor("input_1109_cast_fp16")]; tensor encoder_layers_20_feed_forward2_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_20_feed_forward2_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(426872704))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(431067072))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_20_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_20_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(431069184)))]; tensor linear_189_cast_fp16 = linear(bias = encoder_layers_20_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_20_feed_forward2_linear2_weight_to_fp16_quantized, x = input_1109_cast_fp16)[name = tensor("linear_189_cast_fp16")]; tensor var_4891_to_fp16 = const()[name = tensor("op_4891_to_fp16"), val = tensor(0x1p-1)]; tensor var_4892_cast_fp16 = mul(x = linear_189_cast_fp16, y = var_4891_to_fp16)[name = tensor("op_4892_cast_fp16")]; tensor input_1115_cast_fp16 = add(x = input_1103_cast_fp16, y = var_4892_cast_fp16)[name = tensor("input_1115_cast_fp16")]; tensor input_1117_axes_0 = const()[name = tensor("input_1117_axes_0"), val = tensor([-1])]; tensor encoder_layers_20_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_20_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(431071296)))]; tensor encoder_layers_20_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_20_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(431073408)))]; tensor input_1117_cast_fp16 = layer_norm(axes = input_1117_axes_0, beta = encoder_layers_20_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_20_norm_out_weight_to_fp16, x = input_1115_cast_fp16)[name = tensor("input_1117_cast_fp16")]; tensor cache_85_begin_0 = const()[name = tensor("cache_85_begin_0"), val = tensor([21, 0, 0, 0])]; tensor cache_85_end_0 = const()[name = tensor("cache_85_end_0"), val = tensor([22, 1, 42, 1024])]; tensor cache_85_end_mask_0 = const()[name = tensor("cache_85_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_85_squeeze_mask_0 = const()[name = tensor("cache_85_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_85_cast_fp16 = slice_by_index(begin = cache_85_begin_0, end = cache_85_end_0, end_mask = cache_85_end_mask_0, squeeze_mask = cache_85_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_85_cast_fp16")]; tensor cache_87_begin_0 = const()[name = tensor("cache_87_begin_0"), val = tensor([21, 0, 0, 0])]; tensor cache_87_end_0 = const()[name = tensor("cache_87_end_0"), val = tensor([22, 1, 1024, 8])]; tensor cache_87_end_mask_0 = const()[name = tensor("cache_87_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_87_squeeze_mask_0 = const()[name = tensor("cache_87_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_87_cast_fp16 = slice_by_index(begin = cache_87_begin_0, end = cache_87_end_0, end_mask = cache_87_end_mask_0, squeeze_mask = cache_87_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_87_cast_fp16")]; tensor input_1119_axes_0 = const()[name = tensor("input_1119_axes_0"), val = tensor([-1])]; tensor encoder_layers_21_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_21_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(431075520)))]; tensor encoder_layers_21_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_21_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(431077632)))]; tensor input_1119_cast_fp16 = layer_norm(axes = input_1119_axes_0, beta = encoder_layers_21_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_21_norm_feed_forward1_weight_to_fp16, x = input_1117_cast_fp16)[name = tensor("input_1119_cast_fp16")]; tensor encoder_layers_21_feed_forward1_linear1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_21_feed_forward1_linear1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(431079744))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(435274112))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8805056)))]; tensor encoder_layers_21_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_21_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(435282368)))]; tensor linear_190_cast_fp16 = linear(bias = encoder_layers_21_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_21_feed_forward1_linear1_weight_to_fp16_quantized, x = input_1119_cast_fp16)[name = tensor("linear_190_cast_fp16")]; tensor input_1123_cast_fp16 = silu(x = linear_190_cast_fp16)[name = tensor("input_1123_cast_fp16")]; tensor encoder_layers_21_feed_forward1_linear2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_21_feed_forward1_linear2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(435290624))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(439484992))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_21_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_21_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(439487104)))]; tensor linear_191_cast_fp16 = linear(bias = encoder_layers_21_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_21_feed_forward1_linear2_weight_to_fp16_quantized, x = input_1123_cast_fp16)[name = tensor("linear_191_cast_fp16")]; tensor var_4928_to_fp16 = const()[name = tensor("op_4928_to_fp16"), val = tensor(0x1p-1)]; tensor var_4929_cast_fp16 = mul(x = linear_191_cast_fp16, y = var_4928_to_fp16)[name = tensor("op_4929_cast_fp16")]; tensor input_1129_cast_fp16 = add(x = input_1117_cast_fp16, y = var_4929_cast_fp16)[name = tensor("input_1129_cast_fp16")]; tensor key_43_axes_0 = const()[name = tensor("key_43_axes_0"), val = tensor([-1])]; tensor encoder_layers_21_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_21_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(439489216)))]; tensor encoder_layers_21_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_21_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(439491328)))]; tensor key_43_cast_fp16 = layer_norm(axes = key_43_axes_0, beta = encoder_layers_21_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_21_norm_self_att_weight_to_fp16, x = input_1129_cast_fp16)[name = tensor("key_43_cast_fp16")]; tensor input_1131_interleave_0 = const()[name = tensor("input_1131_interleave_0"), val = tensor(false)]; tensor input_1131_cast_fp16 = concat(axis = var_68, interleave = input_1131_interleave_0, values = (cache_85_cast_fp16, key_43_cast_fp16))[name = tensor("input_1131_cast_fp16")]; tensor var_4951_begin_0 = const()[name = tensor("op_4951_begin_0"), val = tensor([0, 7, 0])]; tensor var_4951_end_0 = const()[name = tensor("op_4951_end_0"), val = tensor([1, 42, 1024])]; tensor var_4951_end_mask_0 = const()[name = tensor("op_4951_end_mask_0"), val = tensor([true, true, true])]; tensor var_4951_cast_fp16 = slice_by_index(begin = var_4951_begin_0, end = var_4951_end_0, end_mask = var_4951_end_mask_0, x = cache_85_cast_fp16)[name = tensor("op_4951_cast_fp16")]; tensor var_4957_interleave_0 = const()[name = tensor("op_4957_interleave_0"), val = tensor(false)]; tensor var_4957_cast_fp16 = concat(axis = var_68, interleave = var_4957_interleave_0, values = (var_4951_cast_fp16, key_43_cast_fp16))[name = tensor("op_4957_cast_fp16")]; tensor encoder_layers_21_self_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_21_self_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(439493440))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(440542080))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_21_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(440544192)))]; tensor linear_192_cast_fp16 = linear(bias = encoder_layers_21_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_21_self_attn_linear_q_weight_to_fp16_quantized, x = key_43_cast_fp16)[name = tensor("linear_192_cast_fp16")]; tensor var_4962 = const()[name = tensor("op_4962"), val = tensor([1, -1, 8, 128])]; tensor q_127_cast_fp16 = reshape(shape = var_4962, x = linear_192_cast_fp16)[name = tensor("q_127_cast_fp16")]; tensor encoder_layers_21_self_attn_linear_k_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_21_self_attn_linear_k_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(440546304))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(441594944))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_21_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(441597056)))]; tensor linear_193_cast_fp16 = linear(bias = encoder_layers_21_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_21_self_attn_linear_k_weight_to_fp16_quantized, x = input_1131_cast_fp16)[name = tensor("linear_193_cast_fp16")]; tensor var_4967 = const()[name = tensor("op_4967"), val = tensor([1, -1, 8, 128])]; tensor k_85_cast_fp16 = reshape(shape = var_4967, x = linear_193_cast_fp16)[name = tensor("k_85_cast_fp16")]; tensor encoder_layers_21_self_attn_linear_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_21_self_attn_linear_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(441599168))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442647808))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor encoder_layers_21_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442649920)))]; tensor linear_194_cast_fp16 = linear(bias = encoder_layers_21_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_21_self_attn_linear_v_weight_to_fp16_quantized, x = input_1131_cast_fp16)[name = tensor("linear_194_cast_fp16")]; tensor var_4972 = const()[name = tensor("op_4972"), val = tensor([1, -1, 8, 128])]; tensor v_43_cast_fp16 = reshape(shape = var_4972, x = linear_194_cast_fp16)[name = tensor("v_43_cast_fp16")]; tensor value_51_perm_0 = const()[name = tensor("value_51_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_21_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442652032)))]; tensor var_4985_cast_fp16 = add(x = q_127_cast_fp16, y = encoder_layers_21_self_attn_pos_bias_u_to_fp16)[name = tensor("op_4985_cast_fp16")]; tensor encoder_layers_21_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442654144)))]; tensor var_4987_cast_fp16 = add(x = q_127_cast_fp16, y = encoder_layers_21_self_attn_pos_bias_v_to_fp16)[name = tensor("op_4987_cast_fp16")]; tensor q_with_bias_v_43_perm_0 = const()[name = tensor("q_with_bias_v_43_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_553_transpose_x_0 = const()[name = tensor("x_553_transpose_x_0"), val = tensor(false)]; tensor x_553_transpose_y_0 = const()[name = tensor("x_553_transpose_y_0"), val = tensor(false)]; tensor op_4989_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_4989_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442656256))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442755840))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442755648)))]; tensor q_with_bias_v_43_cast_fp16 = transpose(perm = q_with_bias_v_43_perm_0, x = var_4987_cast_fp16)[name = tensor("transpose_173")]; tensor x_553_cast_fp16 = matmul(transpose_x = x_553_transpose_x_0, transpose_y = x_553_transpose_y_0, x = q_with_bias_v_43_cast_fp16, y = op_4989_to_fp16_quantized)[name = tensor("x_553_cast_fp16")]; tensor x_555_pad_0 = const()[name = tensor("x_555_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_555_mode_0 = const()[name = tensor("x_555_mode_0"), val = tensor("constant")]; tensor const_352_to_fp16 = const()[name = tensor("const_352_to_fp16"), val = tensor(0x0p+0)]; tensor x_555_cast_fp16 = pad(constant_val = const_352_to_fp16, mode = x_555_mode_0, pad = x_555_pad_0, x = x_553_cast_fp16)[name = tensor("x_555_cast_fp16")]; tensor var_4997 = const()[name = tensor("op_4997"), val = tensor([1, 8, -1, 7])]; tensor x_557_cast_fp16 = reshape(shape = var_4997, x = x_555_cast_fp16)[name = tensor("x_557_cast_fp16")]; tensor var_5001_begin_0 = const()[name = tensor("op_5001_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_5001_end_0 = const()[name = tensor("op_5001_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_5001_end_mask_0 = const()[name = tensor("op_5001_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_5001_cast_fp16 = slice_by_index(begin = var_5001_begin_0, end = var_5001_end_0, end_mask = var_5001_end_mask_0, x = x_557_cast_fp16)[name = tensor("op_5001_cast_fp16")]; tensor var_5002 = const()[name = tensor("op_5002"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_85_cast_fp16 = reshape(shape = var_5002, x = var_5001_cast_fp16)[name = tensor("matrix_bd_85_cast_fp16")]; tensor matrix_ac_43_transpose_x_0 = const()[name = tensor("matrix_ac_43_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_43_transpose_y_0 = const()[name = tensor("matrix_ac_43_transpose_y_0"), val = tensor(false)]; tensor transpose_138_perm_0 = const()[name = tensor("transpose_138_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_139_perm_0 = const()[name = tensor("transpose_139_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_139 = transpose(perm = transpose_139_perm_0, x = k_85_cast_fp16)[name = tensor("transpose_171")]; tensor transpose_138 = transpose(perm = transpose_138_perm_0, x = var_4985_cast_fp16)[name = tensor("transpose_172")]; tensor matrix_ac_43_cast_fp16 = matmul(transpose_x = matrix_ac_43_transpose_x_0, transpose_y = matrix_ac_43_transpose_y_0, x = transpose_138, y = transpose_139)[name = tensor("matrix_ac_43_cast_fp16")]; tensor matrix_bd_87_begin_0 = const()[name = tensor("matrix_bd_87_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_87_end_0 = const()[name = tensor("matrix_bd_87_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_87_end_mask_0 = const()[name = tensor("matrix_bd_87_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_87_cast_fp16 = slice_by_index(begin = matrix_bd_87_begin_0, end = matrix_bd_87_end_0, end_mask = matrix_bd_87_end_mask_0, x = matrix_bd_85_cast_fp16)[name = tensor("matrix_bd_87_cast_fp16")]; tensor var_5011_cast_fp16 = add(x = matrix_ac_43_cast_fp16, y = matrix_bd_87_cast_fp16)[name = tensor("op_5011_cast_fp16")]; tensor _inversed_scores_85_y_0_to_fp16 = const()[name = tensor("_inversed_scores_85_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_85_cast_fp16 = mul(x = var_5011_cast_fp16, y = _inversed_scores_85_y_0_to_fp16)[name = tensor("_inversed_scores_85_cast_fp16")]; tensor scores_87_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_85_cast_fp16, cond = mask_11)[name = tensor("scores_87_cast_fp16")]; tensor var_5017_cast_fp16 = softmax(axis = var_59, x = scores_87_cast_fp16)[name = tensor("op_5017_cast_fp16")]; tensor input_1133_cast_fp16 = select(a = var_44_to_fp16, b = var_5017_cast_fp16, cond = mask_11)[name = tensor("input_1133_cast_fp16")]; tensor x_559_transpose_x_0 = const()[name = tensor("x_559_transpose_x_0"), val = tensor(false)]; tensor x_559_transpose_y_0 = const()[name = tensor("x_559_transpose_y_0"), val = tensor(false)]; tensor value_51_cast_fp16 = transpose(perm = value_51_perm_0, x = v_43_cast_fp16)[name = tensor("transpose_170")]; tensor x_559_cast_fp16 = matmul(transpose_x = x_559_transpose_x_0, transpose_y = x_559_transpose_y_0, x = input_1133_cast_fp16, y = value_51_cast_fp16)[name = tensor("x_559_cast_fp16")]; tensor var_5021_perm_0 = const()[name = tensor("op_5021_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5022 = const()[name = tensor("op_5022"), val = tensor([1, -1, 1024])]; tensor var_5021_cast_fp16 = transpose(perm = var_5021_perm_0, x = x_559_cast_fp16)[name = tensor("transpose_169")]; tensor input_1135_cast_fp16 = reshape(shape = var_5022, x = var_5021_cast_fp16)[name = tensor("input_1135_cast_fp16")]; tensor encoder_layers_21_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442756160)))]; tensor encoder_layers_21_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(444853376)))]; tensor linear_196_cast_fp16 = linear(bias = encoder_layers_21_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_21_self_attn_linear_out_weight_to_fp16, x = input_1135_cast_fp16)[name = tensor("linear_196_cast_fp16")]; tensor input_1139_cast_fp16 = add(x = input_1129_cast_fp16, y = linear_196_cast_fp16)[name = tensor("input_1139_cast_fp16")]; tensor x_563_axes_0 = const()[name = tensor("x_563_axes_0"), val = tensor([-1])]; tensor encoder_layers_21_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_21_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(444855488)))]; tensor encoder_layers_21_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_21_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(444857600)))]; tensor x_563_cast_fp16 = layer_norm(axes = x_563_axes_0, beta = encoder_layers_21_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_21_norm_conv_weight_to_fp16, x = input_1139_cast_fp16)[name = tensor("x_563_cast_fp16")]; tensor input_1141_perm_0 = const()[name = tensor("input_1141_perm_0"), val = tensor([0, 2, 1])]; tensor input_1143_pad_type_0 = const()[name = tensor("input_1143_pad_type_0"), val = tensor("valid")]; tensor input_1143_strides_0 = const()[name = tensor("input_1143_strides_0"), val = tensor([1])]; tensor input_1143_pad_0 = const()[name = tensor("input_1143_pad_0"), val = tensor([0, 0])]; tensor input_1143_dilations_0 = const()[name = tensor("input_1143_dilations_0"), val = tensor([1])]; tensor input_1143_groups_0 = const()[name = tensor("input_1143_groups_0"), val = tensor(1)]; tensor encoder_layers_21_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_21_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(444859712))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446956928))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_1141_cast_fp16 = transpose(perm = input_1141_perm_0, x = x_563_cast_fp16)[name = tensor("transpose_168")]; tensor input_1143_cast_fp16 = conv(dilations = input_1143_dilations_0, groups = input_1143_groups_0, pad = input_1143_pad_0, pad_type = input_1143_pad_type_0, strides = input_1143_strides_0, weight = encoder_layers_21_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_1141_cast_fp16)[name = tensor("input_1143_cast_fp16")]; tensor x_565_split_num_splits_0 = const()[name = tensor("x_565_split_num_splits_0"), val = tensor(2)]; tensor x_565_split_axis_0 = const()[name = tensor("x_565_split_axis_0"), val = tensor(1)]; tensor x_565_split_cast_fp16_0, tensor x_565_split_cast_fp16_1 = split(axis = x_565_split_axis_0, num_splits = x_565_split_num_splits_0, x = input_1143_cast_fp16)[name = tensor("x_565_split_cast_fp16")]; tensor x_565_split_1_sigmoid_cast_fp16 = sigmoid(x = x_565_split_cast_fp16_1)[name = tensor("x_565_split_1_sigmoid_cast_fp16")]; tensor x_565_cast_fp16 = mul(x = x_565_split_cast_fp16_0, y = x_565_split_1_sigmoid_cast_fp16)[name = tensor("x_565_cast_fp16")]; tensor input_1145_cast_fp16 = select(a = var_44_to_fp16, b = x_565_cast_fp16, cond = var_575)[name = tensor("input_1145_cast_fp16")]; tensor new_x_87_interleave_0 = const()[name = tensor("new_x_87_interleave_0"), val = tensor(false)]; tensor new_x_87_cast_fp16 = concat(axis = var_59, interleave = new_x_87_interleave_0, values = (cache_87_cast_fp16, input_1145_cast_fp16))[name = tensor("new_x_87_cast_fp16")]; tensor var_5061_begin_0 = const()[name = tensor("op_5061_begin_0"), val = tensor([0, 0, 7])]; tensor var_5061_end_0 = const()[name = tensor("op_5061_end_0"), val = tensor([1, 1024, 15])]; tensor var_5061_end_mask_0 = const()[name = tensor("op_5061_end_mask_0"), val = tensor([true, true, true])]; tensor var_5061_cast_fp16 = slice_by_index(begin = var_5061_begin_0, end = var_5061_end_0, end_mask = var_5061_end_mask_0, x = new_x_87_cast_fp16)[name = tensor("op_5061_cast_fp16")]; tensor x_567_pad_type_0 = const()[name = tensor("x_567_pad_type_0"), val = tensor("valid")]; tensor x_567_groups_0 = const()[name = tensor("x_567_groups_0"), val = tensor(1024)]; tensor x_567_strides_0 = const()[name = tensor("x_567_strides_0"), val = tensor([1])]; tensor x_567_pad_0 = const()[name = tensor("x_567_pad_0"), val = tensor([0, 0])]; tensor x_567_dilations_0 = const()[name = tensor("x_567_dilations_0"), val = tensor([1])]; tensor encoder_layers_21_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_21_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446961088))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446970368))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_567_cast_fp16 = conv(dilations = x_567_dilations_0, groups = x_567_groups_0, pad = x_567_pad_0, pad_type = x_567_pad_type_0, strides = x_567_strides_0, weight = encoder_layers_21_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_87_cast_fp16)[name = tensor("x_567_cast_fp16")]; tensor input_1147_perm_0 = const()[name = tensor("input_1147_perm_0"), val = tensor([0, 2, 1])]; tensor x_569_axes_0 = const()[name = tensor("x_569_axes_0"), val = tensor([-1])]; tensor encoder_layers_21_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_21_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446972480)))]; tensor encoder_layers_21_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_21_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446974592)))]; tensor input_1147_cast_fp16 = transpose(perm = input_1147_perm_0, x = x_567_cast_fp16)[name = tensor("transpose_167")]; tensor x_569_cast_fp16 = layer_norm(axes = x_569_axes_0, beta = encoder_layers_21_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_21_conv_batch_norm_weight_to_fp16, x = input_1147_cast_fp16)[name = tensor("x_569_cast_fp16")]; tensor input_1149_perm_0 = const()[name = tensor("input_1149_perm_0"), val = tensor([0, 2, 1])]; tensor input_1149_cast_fp16 = transpose(perm = input_1149_perm_0, x = x_569_cast_fp16)[name = tensor("transpose_166")]; tensor input_1151_cast_fp16 = silu(x = input_1149_cast_fp16)[name = tensor("input_1151_cast_fp16")]; tensor x_571_pad_type_0 = const()[name = tensor("x_571_pad_type_0"), val = tensor("valid")]; tensor x_571_strides_0 = const()[name = tensor("x_571_strides_0"), val = tensor([1])]; tensor x_571_pad_0 = const()[name = tensor("x_571_pad_0"), val = tensor([0, 0])]; tensor x_571_dilations_0 = const()[name = tensor("x_571_dilations_0"), val = tensor([1])]; tensor x_571_groups_0 = const()[name = tensor("x_571_groups_0"), val = tensor(1)]; tensor encoder_layers_21_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_21_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446976704))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448025344))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_571_cast_fp16 = conv(dilations = x_571_dilations_0, groups = x_571_groups_0, pad = x_571_pad_0, pad_type = x_571_pad_type_0, strides = x_571_strides_0, weight = encoder_layers_21_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_1151_cast_fp16)[name = tensor("x_571_cast_fp16")]; tensor input_1153_perm_0 = const()[name = tensor("input_1153_perm_0"), val = tensor([0, 2, 1])]; tensor input_1153_cast_fp16 = transpose(perm = input_1153_perm_0, x = x_571_cast_fp16)[name = tensor("transpose_165")]; tensor input_1155_cast_fp16 = add(x = input_1139_cast_fp16, y = input_1153_cast_fp16)[name = tensor("input_1155_cast_fp16")]; tensor input_1157_axes_0 = const()[name = tensor("input_1157_axes_0"), val = tensor([-1])]; tensor encoder_layers_21_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_21_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448027456)))]; tensor encoder_layers_21_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_21_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448029568)))]; tensor input_1157_cast_fp16 = layer_norm(axes = input_1157_axes_0, beta = encoder_layers_21_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_21_norm_feed_forward2_weight_to_fp16, x = input_1155_cast_fp16)[name = tensor("input_1157_cast_fp16")]; tensor encoder_layers_21_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_21_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448031680)))]; tensor encoder_layers_21_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_21_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(456420352)))]; tensor linear_197_cast_fp16 = linear(bias = encoder_layers_21_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_21_feed_forward2_linear1_weight_to_fp16, x = input_1157_cast_fp16)[name = tensor("linear_197_cast_fp16")]; tensor input_1161_cast_fp16 = silu(x = linear_197_cast_fp16)[name = tensor("input_1161_cast_fp16")]; tensor encoder_layers_21_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_21_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(456428608)))]; tensor encoder_layers_21_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_21_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464817280)))]; tensor linear_198_cast_fp16 = linear(bias = encoder_layers_21_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_21_feed_forward2_linear2_weight_to_fp16, x = input_1161_cast_fp16)[name = tensor("linear_198_cast_fp16")]; tensor var_5104_to_fp16 = const()[name = tensor("op_5104_to_fp16"), val = tensor(0x1p-1)]; tensor var_5105_cast_fp16 = mul(x = linear_198_cast_fp16, y = var_5104_to_fp16)[name = tensor("op_5105_cast_fp16")]; tensor input_1167_cast_fp16 = add(x = input_1155_cast_fp16, y = var_5105_cast_fp16)[name = tensor("input_1167_cast_fp16")]; tensor input_1169_axes_0 = const()[name = tensor("input_1169_axes_0"), val = tensor([-1])]; tensor encoder_layers_21_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_21_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464819392)))]; tensor encoder_layers_21_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_21_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464821504)))]; tensor input_1169_cast_fp16 = layer_norm(axes = input_1169_axes_0, beta = encoder_layers_21_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_21_norm_out_weight_to_fp16, x = input_1167_cast_fp16)[name = tensor("input_1169_cast_fp16")]; tensor cache_89_begin_0 = const()[name = tensor("cache_89_begin_0"), val = tensor([22, 0, 0, 0])]; tensor cache_89_end_0 = const()[name = tensor("cache_89_end_0"), val = tensor([23, 1, 42, 1024])]; tensor cache_89_end_mask_0 = const()[name = tensor("cache_89_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_89_squeeze_mask_0 = const()[name = tensor("cache_89_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_89_cast_fp16 = slice_by_index(begin = cache_89_begin_0, end = cache_89_end_0, end_mask = cache_89_end_mask_0, squeeze_mask = cache_89_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_89_cast_fp16")]; tensor cache_91_begin_0 = const()[name = tensor("cache_91_begin_0"), val = tensor([22, 0, 0, 0])]; tensor cache_91_end_0 = const()[name = tensor("cache_91_end_0"), val = tensor([23, 1, 1024, 8])]; tensor cache_91_end_mask_0 = const()[name = tensor("cache_91_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_91_squeeze_mask_0 = const()[name = tensor("cache_91_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_91_cast_fp16 = slice_by_index(begin = cache_91_begin_0, end = cache_91_end_0, end_mask = cache_91_end_mask_0, squeeze_mask = cache_91_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_91_cast_fp16")]; tensor input_1171_axes_0 = const()[name = tensor("input_1171_axes_0"), val = tensor([-1])]; tensor encoder_layers_22_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_22_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464823616)))]; tensor encoder_layers_22_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_22_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464825728)))]; tensor input_1171_cast_fp16 = layer_norm(axes = input_1171_axes_0, beta = encoder_layers_22_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_22_norm_feed_forward1_weight_to_fp16, x = input_1169_cast_fp16)[name = tensor("input_1171_cast_fp16")]; tensor encoder_layers_22_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_22_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464827840)))]; tensor encoder_layers_22_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_22_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(473216512)))]; tensor linear_199_cast_fp16 = linear(bias = encoder_layers_22_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_22_feed_forward1_linear1_weight_to_fp16, x = input_1171_cast_fp16)[name = tensor("linear_199_cast_fp16")]; tensor input_1175_cast_fp16 = silu(x = linear_199_cast_fp16)[name = tensor("input_1175_cast_fp16")]; tensor encoder_layers_22_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_22_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(473224768)))]; tensor encoder_layers_22_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_22_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(481613440)))]; tensor linear_200_cast_fp16 = linear(bias = encoder_layers_22_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_22_feed_forward1_linear2_weight_to_fp16, x = input_1175_cast_fp16)[name = tensor("linear_200_cast_fp16")]; tensor var_5141_to_fp16 = const()[name = tensor("op_5141_to_fp16"), val = tensor(0x1p-1)]; tensor var_5142_cast_fp16 = mul(x = linear_200_cast_fp16, y = var_5141_to_fp16)[name = tensor("op_5142_cast_fp16")]; tensor input_1181_cast_fp16 = add(x = input_1169_cast_fp16, y = var_5142_cast_fp16)[name = tensor("input_1181_cast_fp16")]; tensor key_45_axes_0 = const()[name = tensor("key_45_axes_0"), val = tensor([-1])]; tensor encoder_layers_22_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_22_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(481615552)))]; tensor encoder_layers_22_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_22_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(481617664)))]; tensor key_45_cast_fp16 = layer_norm(axes = key_45_axes_0, beta = encoder_layers_22_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_22_norm_self_att_weight_to_fp16, x = input_1181_cast_fp16)[name = tensor("key_45_cast_fp16")]; tensor input_1183_interleave_0 = const()[name = tensor("input_1183_interleave_0"), val = tensor(false)]; tensor input_1183_cast_fp16 = concat(axis = var_68, interleave = input_1183_interleave_0, values = (cache_89_cast_fp16, key_45_cast_fp16))[name = tensor("input_1183_cast_fp16")]; tensor var_5164_begin_0 = const()[name = tensor("op_5164_begin_0"), val = tensor([0, 7, 0])]; tensor var_5164_end_0 = const()[name = tensor("op_5164_end_0"), val = tensor([1, 42, 1024])]; tensor var_5164_end_mask_0 = const()[name = tensor("op_5164_end_mask_0"), val = tensor([true, true, true])]; tensor var_5164_cast_fp16 = slice_by_index(begin = var_5164_begin_0, end = var_5164_end_0, end_mask = var_5164_end_mask_0, x = cache_89_cast_fp16)[name = tensor("op_5164_cast_fp16")]; tensor var_5170_interleave_0 = const()[name = tensor("op_5170_interleave_0"), val = tensor(false)]; tensor var_5170_cast_fp16 = concat(axis = var_68, interleave = var_5170_interleave_0, values = (var_5164_cast_fp16, key_45_cast_fp16))[name = tensor("op_5170_cast_fp16")]; tensor encoder_layers_22_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(481619776)))]; tensor encoder_layers_22_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(483716992)))]; tensor linear_201_cast_fp16 = linear(bias = encoder_layers_22_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_22_self_attn_linear_q_weight_to_fp16, x = key_45_cast_fp16)[name = tensor("linear_201_cast_fp16")]; tensor var_5175 = const()[name = tensor("op_5175"), val = tensor([1, -1, 8, 128])]; tensor q_133_cast_fp16 = reshape(shape = var_5175, x = linear_201_cast_fp16)[name = tensor("q_133_cast_fp16")]; tensor encoder_layers_22_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(483719104)))]; tensor encoder_layers_22_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(485816320)))]; tensor linear_202_cast_fp16 = linear(bias = encoder_layers_22_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_22_self_attn_linear_k_weight_to_fp16, x = input_1183_cast_fp16)[name = tensor("linear_202_cast_fp16")]; tensor var_5180 = const()[name = tensor("op_5180"), val = tensor([1, -1, 8, 128])]; tensor k_89_cast_fp16 = reshape(shape = var_5180, x = linear_202_cast_fp16)[name = tensor("k_89_cast_fp16")]; tensor encoder_layers_22_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(485818432)))]; tensor encoder_layers_22_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(487915648)))]; tensor linear_203_cast_fp16 = linear(bias = encoder_layers_22_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_22_self_attn_linear_v_weight_to_fp16, x = input_1183_cast_fp16)[name = tensor("linear_203_cast_fp16")]; tensor var_5185 = const()[name = tensor("op_5185"), val = tensor([1, -1, 8, 128])]; tensor v_45_cast_fp16 = reshape(shape = var_5185, x = linear_203_cast_fp16)[name = tensor("v_45_cast_fp16")]; tensor value_53_perm_0 = const()[name = tensor("value_53_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_22_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(487917760)))]; tensor var_5198_cast_fp16 = add(x = q_133_cast_fp16, y = encoder_layers_22_self_attn_pos_bias_u_to_fp16)[name = tensor("op_5198_cast_fp16")]; tensor encoder_layers_22_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(487919872)))]; tensor var_5200_cast_fp16 = add(x = q_133_cast_fp16, y = encoder_layers_22_self_attn_pos_bias_v_to_fp16)[name = tensor("op_5200_cast_fp16")]; tensor q_with_bias_v_45_perm_0 = const()[name = tensor("q_with_bias_v_45_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_579_transpose_x_0 = const()[name = tensor("x_579_transpose_x_0"), val = tensor(false)]; tensor x_579_transpose_y_0 = const()[name = tensor("x_579_transpose_y_0"), val = tensor(false)]; tensor op_5202_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_5202_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(487921984))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488021568))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488021376)))]; tensor q_with_bias_v_45_cast_fp16 = transpose(perm = q_with_bias_v_45_perm_0, x = var_5200_cast_fp16)[name = tensor("transpose_164")]; tensor x_579_cast_fp16 = matmul(transpose_x = x_579_transpose_x_0, transpose_y = x_579_transpose_y_0, x = q_with_bias_v_45_cast_fp16, y = op_5202_to_fp16_quantized)[name = tensor("x_579_cast_fp16")]; tensor x_581_pad_0 = const()[name = tensor("x_581_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_581_mode_0 = const()[name = tensor("x_581_mode_0"), val = tensor("constant")]; tensor const_365_to_fp16 = const()[name = tensor("const_365_to_fp16"), val = tensor(0x0p+0)]; tensor x_581_cast_fp16 = pad(constant_val = const_365_to_fp16, mode = x_581_mode_0, pad = x_581_pad_0, x = x_579_cast_fp16)[name = tensor("x_581_cast_fp16")]; tensor var_5210 = const()[name = tensor("op_5210"), val = tensor([1, 8, -1, 7])]; tensor x_583_cast_fp16 = reshape(shape = var_5210, x = x_581_cast_fp16)[name = tensor("x_583_cast_fp16")]; tensor var_5214_begin_0 = const()[name = tensor("op_5214_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_5214_end_0 = const()[name = tensor("op_5214_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_5214_end_mask_0 = const()[name = tensor("op_5214_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_5214_cast_fp16 = slice_by_index(begin = var_5214_begin_0, end = var_5214_end_0, end_mask = var_5214_end_mask_0, x = x_583_cast_fp16)[name = tensor("op_5214_cast_fp16")]; tensor var_5215 = const()[name = tensor("op_5215"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_89_cast_fp16 = reshape(shape = var_5215, x = var_5214_cast_fp16)[name = tensor("matrix_bd_89_cast_fp16")]; tensor matrix_ac_45_transpose_x_0 = const()[name = tensor("matrix_ac_45_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_45_transpose_y_0 = const()[name = tensor("matrix_ac_45_transpose_y_0"), val = tensor(false)]; tensor transpose_140_perm_0 = const()[name = tensor("transpose_140_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_141_perm_0 = const()[name = tensor("transpose_141_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_141 = transpose(perm = transpose_141_perm_0, x = k_89_cast_fp16)[name = tensor("transpose_162")]; tensor transpose_140 = transpose(perm = transpose_140_perm_0, x = var_5198_cast_fp16)[name = tensor("transpose_163")]; tensor matrix_ac_45_cast_fp16 = matmul(transpose_x = matrix_ac_45_transpose_x_0, transpose_y = matrix_ac_45_transpose_y_0, x = transpose_140, y = transpose_141)[name = tensor("matrix_ac_45_cast_fp16")]; tensor matrix_bd_91_begin_0 = const()[name = tensor("matrix_bd_91_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_91_end_0 = const()[name = tensor("matrix_bd_91_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_91_end_mask_0 = const()[name = tensor("matrix_bd_91_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_91_cast_fp16 = slice_by_index(begin = matrix_bd_91_begin_0, end = matrix_bd_91_end_0, end_mask = matrix_bd_91_end_mask_0, x = matrix_bd_89_cast_fp16)[name = tensor("matrix_bd_91_cast_fp16")]; tensor var_5224_cast_fp16 = add(x = matrix_ac_45_cast_fp16, y = matrix_bd_91_cast_fp16)[name = tensor("op_5224_cast_fp16")]; tensor _inversed_scores_89_y_0_to_fp16 = const()[name = tensor("_inversed_scores_89_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_89_cast_fp16 = mul(x = var_5224_cast_fp16, y = _inversed_scores_89_y_0_to_fp16)[name = tensor("_inversed_scores_89_cast_fp16")]; tensor scores_91_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_89_cast_fp16, cond = mask_11)[name = tensor("scores_91_cast_fp16")]; tensor var_5230_cast_fp16 = softmax(axis = var_59, x = scores_91_cast_fp16)[name = tensor("op_5230_cast_fp16")]; tensor input_1185_cast_fp16 = select(a = var_44_to_fp16, b = var_5230_cast_fp16, cond = mask_11)[name = tensor("input_1185_cast_fp16")]; tensor x_585_transpose_x_0 = const()[name = tensor("x_585_transpose_x_0"), val = tensor(false)]; tensor x_585_transpose_y_0 = const()[name = tensor("x_585_transpose_y_0"), val = tensor(false)]; tensor value_53_cast_fp16 = transpose(perm = value_53_perm_0, x = v_45_cast_fp16)[name = tensor("transpose_161")]; tensor x_585_cast_fp16 = matmul(transpose_x = x_585_transpose_x_0, transpose_y = x_585_transpose_y_0, x = input_1185_cast_fp16, y = value_53_cast_fp16)[name = tensor("x_585_cast_fp16")]; tensor var_5234_perm_0 = const()[name = tensor("op_5234_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5235 = const()[name = tensor("op_5235"), val = tensor([1, -1, 1024])]; tensor var_5234_cast_fp16 = transpose(perm = var_5234_perm_0, x = x_585_cast_fp16)[name = tensor("transpose_160")]; tensor input_1187_cast_fp16 = reshape(shape = var_5235, x = var_5234_cast_fp16)[name = tensor("input_1187_cast_fp16")]; tensor encoder_layers_22_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488021888)))]; tensor encoder_layers_22_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490119104)))]; tensor linear_205_cast_fp16 = linear(bias = encoder_layers_22_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_22_self_attn_linear_out_weight_to_fp16, x = input_1187_cast_fp16)[name = tensor("linear_205_cast_fp16")]; tensor input_1191_cast_fp16 = add(x = input_1181_cast_fp16, y = linear_205_cast_fp16)[name = tensor("input_1191_cast_fp16")]; tensor x_589_axes_0 = const()[name = tensor("x_589_axes_0"), val = tensor([-1])]; tensor encoder_layers_22_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_22_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490121216)))]; tensor encoder_layers_22_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_22_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490123328)))]; tensor x_589_cast_fp16 = layer_norm(axes = x_589_axes_0, beta = encoder_layers_22_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_22_norm_conv_weight_to_fp16, x = input_1191_cast_fp16)[name = tensor("x_589_cast_fp16")]; tensor input_1193_perm_0 = const()[name = tensor("input_1193_perm_0"), val = tensor([0, 2, 1])]; tensor input_1195_pad_type_0 = const()[name = tensor("input_1195_pad_type_0"), val = tensor("valid")]; tensor input_1195_strides_0 = const()[name = tensor("input_1195_strides_0"), val = tensor([1])]; tensor input_1195_pad_0 = const()[name = tensor("input_1195_pad_0"), val = tensor([0, 0])]; tensor input_1195_dilations_0 = const()[name = tensor("input_1195_dilations_0"), val = tensor([1])]; tensor input_1195_groups_0 = const()[name = tensor("input_1195_groups_0"), val = tensor(1)]; tensor encoder_layers_22_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_22_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490125440))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492222656))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_1193_cast_fp16 = transpose(perm = input_1193_perm_0, x = x_589_cast_fp16)[name = tensor("transpose_159")]; tensor input_1195_cast_fp16 = conv(dilations = input_1195_dilations_0, groups = input_1195_groups_0, pad = input_1195_pad_0, pad_type = input_1195_pad_type_0, strides = input_1195_strides_0, weight = encoder_layers_22_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_1193_cast_fp16)[name = tensor("input_1195_cast_fp16")]; tensor x_591_split_num_splits_0 = const()[name = tensor("x_591_split_num_splits_0"), val = tensor(2)]; tensor x_591_split_axis_0 = const()[name = tensor("x_591_split_axis_0"), val = tensor(1)]; tensor x_591_split_cast_fp16_0, tensor x_591_split_cast_fp16_1 = split(axis = x_591_split_axis_0, num_splits = x_591_split_num_splits_0, x = input_1195_cast_fp16)[name = tensor("x_591_split_cast_fp16")]; tensor x_591_split_1_sigmoid_cast_fp16 = sigmoid(x = x_591_split_cast_fp16_1)[name = tensor("x_591_split_1_sigmoid_cast_fp16")]; tensor x_591_cast_fp16 = mul(x = x_591_split_cast_fp16_0, y = x_591_split_1_sigmoid_cast_fp16)[name = tensor("x_591_cast_fp16")]; tensor input_1197_cast_fp16 = select(a = var_44_to_fp16, b = x_591_cast_fp16, cond = var_575)[name = tensor("input_1197_cast_fp16")]; tensor new_x_91_interleave_0 = const()[name = tensor("new_x_91_interleave_0"), val = tensor(false)]; tensor new_x_91_cast_fp16 = concat(axis = var_59, interleave = new_x_91_interleave_0, values = (cache_91_cast_fp16, input_1197_cast_fp16))[name = tensor("new_x_91_cast_fp16")]; tensor var_5274_begin_0 = const()[name = tensor("op_5274_begin_0"), val = tensor([0, 0, 7])]; tensor var_5274_end_0 = const()[name = tensor("op_5274_end_0"), val = tensor([1, 1024, 15])]; tensor var_5274_end_mask_0 = const()[name = tensor("op_5274_end_mask_0"), val = tensor([true, true, true])]; tensor var_5274_cast_fp16 = slice_by_index(begin = var_5274_begin_0, end = var_5274_end_0, end_mask = var_5274_end_mask_0, x = new_x_91_cast_fp16)[name = tensor("op_5274_cast_fp16")]; tensor x_593_pad_type_0 = const()[name = tensor("x_593_pad_type_0"), val = tensor("valid")]; tensor x_593_groups_0 = const()[name = tensor("x_593_groups_0"), val = tensor(1024)]; tensor x_593_strides_0 = const()[name = tensor("x_593_strides_0"), val = tensor([1])]; tensor x_593_pad_0 = const()[name = tensor("x_593_pad_0"), val = tensor([0, 0])]; tensor x_593_dilations_0 = const()[name = tensor("x_593_dilations_0"), val = tensor([1])]; tensor encoder_layers_22_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_22_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492226816))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492236096))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_593_cast_fp16 = conv(dilations = x_593_dilations_0, groups = x_593_groups_0, pad = x_593_pad_0, pad_type = x_593_pad_type_0, strides = x_593_strides_0, weight = encoder_layers_22_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_91_cast_fp16)[name = tensor("x_593_cast_fp16")]; tensor input_1199_perm_0 = const()[name = tensor("input_1199_perm_0"), val = tensor([0, 2, 1])]; tensor x_595_axes_0 = const()[name = tensor("x_595_axes_0"), val = tensor([-1])]; tensor encoder_layers_22_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_22_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492238208)))]; tensor encoder_layers_22_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_22_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492240320)))]; tensor input_1199_cast_fp16 = transpose(perm = input_1199_perm_0, x = x_593_cast_fp16)[name = tensor("transpose_158")]; tensor x_595_cast_fp16 = layer_norm(axes = x_595_axes_0, beta = encoder_layers_22_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_22_conv_batch_norm_weight_to_fp16, x = input_1199_cast_fp16)[name = tensor("x_595_cast_fp16")]; tensor input_1201_perm_0 = const()[name = tensor("input_1201_perm_0"), val = tensor([0, 2, 1])]; tensor input_1201_cast_fp16 = transpose(perm = input_1201_perm_0, x = x_595_cast_fp16)[name = tensor("transpose_157")]; tensor input_1203_cast_fp16 = silu(x = input_1201_cast_fp16)[name = tensor("input_1203_cast_fp16")]; tensor x_597_pad_type_0 = const()[name = tensor("x_597_pad_type_0"), val = tensor("valid")]; tensor x_597_strides_0 = const()[name = tensor("x_597_strides_0"), val = tensor([1])]; tensor x_597_pad_0 = const()[name = tensor("x_597_pad_0"), val = tensor([0, 0])]; tensor x_597_dilations_0 = const()[name = tensor("x_597_dilations_0"), val = tensor([1])]; tensor x_597_groups_0 = const()[name = tensor("x_597_groups_0"), val = tensor(1)]; tensor encoder_layers_22_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_22_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492242432))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(493291072))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_597_cast_fp16 = conv(dilations = x_597_dilations_0, groups = x_597_groups_0, pad = x_597_pad_0, pad_type = x_597_pad_type_0, strides = x_597_strides_0, weight = encoder_layers_22_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_1203_cast_fp16)[name = tensor("x_597_cast_fp16")]; tensor input_1205_perm_0 = const()[name = tensor("input_1205_perm_0"), val = tensor([0, 2, 1])]; tensor input_1205_cast_fp16 = transpose(perm = input_1205_perm_0, x = x_597_cast_fp16)[name = tensor("transpose_156")]; tensor input_1207_cast_fp16 = add(x = input_1191_cast_fp16, y = input_1205_cast_fp16)[name = tensor("input_1207_cast_fp16")]; tensor input_1209_axes_0 = const()[name = tensor("input_1209_axes_0"), val = tensor([-1])]; tensor encoder_layers_22_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_22_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(493293184)))]; tensor encoder_layers_22_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_22_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(493295296)))]; tensor input_1209_cast_fp16 = layer_norm(axes = input_1209_axes_0, beta = encoder_layers_22_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_22_norm_feed_forward2_weight_to_fp16, x = input_1207_cast_fp16)[name = tensor("input_1209_cast_fp16")]; tensor encoder_layers_22_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_22_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(493297408)))]; tensor encoder_layers_22_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_22_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(501686080)))]; tensor linear_206_cast_fp16 = linear(bias = encoder_layers_22_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_22_feed_forward2_linear1_weight_to_fp16, x = input_1209_cast_fp16)[name = tensor("linear_206_cast_fp16")]; tensor input_1213_cast_fp16 = silu(x = linear_206_cast_fp16)[name = tensor("input_1213_cast_fp16")]; tensor encoder_layers_22_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_22_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(501694336)))]; tensor encoder_layers_22_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_22_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(510083008)))]; tensor linear_207_cast_fp16 = linear(bias = encoder_layers_22_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_22_feed_forward2_linear2_weight_to_fp16, x = input_1213_cast_fp16)[name = tensor("linear_207_cast_fp16")]; tensor var_5317_to_fp16 = const()[name = tensor("op_5317_to_fp16"), val = tensor(0x1p-1)]; tensor var_5318_cast_fp16 = mul(x = linear_207_cast_fp16, y = var_5317_to_fp16)[name = tensor("op_5318_cast_fp16")]; tensor input_1219_cast_fp16 = add(x = input_1207_cast_fp16, y = var_5318_cast_fp16)[name = tensor("input_1219_cast_fp16")]; tensor input_1221_axes_0 = const()[name = tensor("input_1221_axes_0"), val = tensor([-1])]; tensor encoder_layers_22_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_22_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(510085120)))]; tensor encoder_layers_22_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_22_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(510087232)))]; tensor input_1221_cast_fp16 = layer_norm(axes = input_1221_axes_0, beta = encoder_layers_22_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_22_norm_out_weight_to_fp16, x = input_1219_cast_fp16)[name = tensor("input_1221_cast_fp16")]; tensor cache_93_begin_0 = const()[name = tensor("cache_93_begin_0"), val = tensor([23, 0, 0, 0])]; tensor cache_93_end_0 = const()[name = tensor("cache_93_end_0"), val = tensor([24, 1, 42, 1024])]; tensor cache_93_end_mask_0 = const()[name = tensor("cache_93_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_93_squeeze_mask_0 = const()[name = tensor("cache_93_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_93_cast_fp16 = slice_by_index(begin = cache_93_begin_0, end = cache_93_end_0, end_mask = cache_93_end_mask_0, squeeze_mask = cache_93_squeeze_mask_0, x = value_3_cast_fp16)[name = tensor("cache_93_cast_fp16")]; tensor cache_begin_0 = const()[name = tensor("cache_begin_0"), val = tensor([23, 0, 0, 0])]; tensor cache_end_0 = const()[name = tensor("cache_end_0"), val = tensor([24, 1, 1024, 8])]; tensor cache_end_mask_0 = const()[name = tensor("cache_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_squeeze_mask_0 = const()[name = tensor("cache_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_cast_fp16 = slice_by_index(begin = cache_begin_0, end = cache_end_0, end_mask = cache_end_mask_0, squeeze_mask = cache_squeeze_mask_0, x = value_5_cast_fp16)[name = tensor("cache_cast_fp16")]; tensor input_1223_axes_0 = const()[name = tensor("input_1223_axes_0"), val = tensor([-1])]; tensor encoder_layers_23_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_23_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(510089344)))]; tensor encoder_layers_23_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_23_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(510091456)))]; tensor input_1223_cast_fp16 = layer_norm(axes = input_1223_axes_0, beta = encoder_layers_23_norm_feed_forward1_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_23_norm_feed_forward1_weight_to_fp16, x = input_1221_cast_fp16)[name = tensor("input_1223_cast_fp16")]; tensor encoder_layers_23_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_23_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(510093568)))]; tensor encoder_layers_23_feed_forward1_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_23_feed_forward1_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(518482240)))]; tensor linear_208_cast_fp16 = linear(bias = encoder_layers_23_feed_forward1_linear1_bias_to_fp16, weight = encoder_layers_23_feed_forward1_linear1_weight_to_fp16, x = input_1223_cast_fp16)[name = tensor("linear_208_cast_fp16")]; tensor input_1227_cast_fp16 = silu(x = linear_208_cast_fp16)[name = tensor("input_1227_cast_fp16")]; tensor encoder_layers_23_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_23_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(518490496)))]; tensor encoder_layers_23_feed_forward1_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_23_feed_forward1_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526879168)))]; tensor linear_209_cast_fp16 = linear(bias = encoder_layers_23_feed_forward1_linear2_bias_to_fp16, weight = encoder_layers_23_feed_forward1_linear2_weight_to_fp16, x = input_1227_cast_fp16)[name = tensor("linear_209_cast_fp16")]; tensor var_5354_to_fp16 = const()[name = tensor("op_5354_to_fp16"), val = tensor(0x1p-1)]; tensor var_5355_cast_fp16 = mul(x = linear_209_cast_fp16, y = var_5354_to_fp16)[name = tensor("op_5355_cast_fp16")]; tensor input_1233_cast_fp16 = add(x = input_1221_cast_fp16, y = var_5355_cast_fp16)[name = tensor("input_1233_cast_fp16")]; tensor key_axes_0 = const()[name = tensor("key_axes_0"), val = tensor([-1])]; tensor encoder_layers_23_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_23_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526881280)))]; tensor encoder_layers_23_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_23_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526883392)))]; tensor key_cast_fp16 = layer_norm(axes = key_axes_0, beta = encoder_layers_23_norm_self_att_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_23_norm_self_att_weight_to_fp16, x = input_1233_cast_fp16)[name = tensor("key_cast_fp16")]; tensor input_1235_interleave_0 = const()[name = tensor("input_1235_interleave_0"), val = tensor(false)]; tensor input_1235_cast_fp16 = concat(axis = var_68, interleave = input_1235_interleave_0, values = (cache_93_cast_fp16, key_cast_fp16))[name = tensor("input_1235_cast_fp16")]; tensor var_5377_begin_0 = const()[name = tensor("op_5377_begin_0"), val = tensor([0, 7, 0])]; tensor var_5377_end_0 = const()[name = tensor("op_5377_end_0"), val = tensor([1, 42, 1024])]; tensor var_5377_end_mask_0 = const()[name = tensor("op_5377_end_mask_0"), val = tensor([true, true, true])]; tensor var_5377_cast_fp16 = slice_by_index(begin = var_5377_begin_0, end = var_5377_end_0, end_mask = var_5377_end_mask_0, x = cache_93_cast_fp16)[name = tensor("op_5377_cast_fp16")]; tensor cache_last_channel_cur_interleave_0 = const()[name = tensor("cache_last_channel_cur_interleave_0"), val = tensor(false)]; tensor cache_last_channel_cur_cast_fp16 = concat(axis = var_68, interleave = cache_last_channel_cur_interleave_0, values = (var_5377_cast_fp16, key_cast_fp16))[name = tensor("cache_last_channel_cur_cast_fp16")]; tensor encoder_layers_23_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526885504)))]; tensor encoder_layers_23_self_attn_linear_q_bias_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528982720)))]; tensor linear_210_cast_fp16 = linear(bias = encoder_layers_23_self_attn_linear_q_bias_to_fp16, weight = encoder_layers_23_self_attn_linear_q_weight_to_fp16, x = key_cast_fp16)[name = tensor("linear_210_cast_fp16")]; tensor var_5388 = const()[name = tensor("op_5388"), val = tensor([1, -1, 8, 128])]; tensor q_139_cast_fp16 = reshape(shape = var_5388, x = linear_210_cast_fp16)[name = tensor("q_139_cast_fp16")]; tensor encoder_layers_23_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528984832)))]; tensor encoder_layers_23_self_attn_linear_k_bias_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_linear_k_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(531082048)))]; tensor linear_211_cast_fp16 = linear(bias = encoder_layers_23_self_attn_linear_k_bias_to_fp16, weight = encoder_layers_23_self_attn_linear_k_weight_to_fp16, x = input_1235_cast_fp16)[name = tensor("linear_211_cast_fp16")]; tensor var_5393 = const()[name = tensor("op_5393"), val = tensor([1, -1, 8, 128])]; tensor k_93_cast_fp16 = reshape(shape = var_5393, x = linear_211_cast_fp16)[name = tensor("k_93_cast_fp16")]; tensor encoder_layers_23_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(531084160)))]; tensor encoder_layers_23_self_attn_linear_v_bias_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_linear_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533181376)))]; tensor linear_212_cast_fp16 = linear(bias = encoder_layers_23_self_attn_linear_v_bias_to_fp16, weight = encoder_layers_23_self_attn_linear_v_weight_to_fp16, x = input_1235_cast_fp16)[name = tensor("linear_212_cast_fp16")]; tensor var_5398 = const()[name = tensor("op_5398"), val = tensor([1, -1, 8, 128])]; tensor v_cast_fp16 = reshape(shape = var_5398, x = linear_212_cast_fp16)[name = tensor("v_cast_fp16")]; tensor value_perm_0 = const()[name = tensor("value_perm_0"), val = tensor([0, 2, -3, -1])]; tensor encoder_layers_23_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533183488)))]; tensor var_5411_cast_fp16 = add(x = q_139_cast_fp16, y = encoder_layers_23_self_attn_pos_bias_u_to_fp16)[name = tensor("op_5411_cast_fp16")]; tensor encoder_layers_23_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533185600)))]; tensor var_5413_cast_fp16 = add(x = q_139_cast_fp16, y = encoder_layers_23_self_attn_pos_bias_v_to_fp16)[name = tensor("op_5413_cast_fp16")]; tensor q_with_bias_v_perm_0 = const()[name = tensor("q_with_bias_v_perm_0"), val = tensor([0, 2, -3, -1])]; tensor x_605_transpose_x_0 = const()[name = tensor("x_605_transpose_x_0"), val = tensor(false)]; tensor x_605_transpose_y_0 = const()[name = tensor("x_605_transpose_y_0"), val = tensor(false)]; tensor op_5415_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(3), name = tensor("op_5415_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533187712))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533287296))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533287104)))]; tensor q_with_bias_v_cast_fp16 = transpose(perm = q_with_bias_v_perm_0, x = var_5413_cast_fp16)[name = tensor("transpose_155")]; tensor x_605_cast_fp16 = matmul(transpose_x = x_605_transpose_x_0, transpose_y = x_605_transpose_y_0, x = q_with_bias_v_cast_fp16, y = op_5415_to_fp16_quantized)[name = tensor("x_605_cast_fp16")]; tensor x_607_pad_0 = const()[name = tensor("x_607_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_607_mode_0 = const()[name = tensor("x_607_mode_0"), val = tensor("constant")]; tensor const_378_to_fp16 = const()[name = tensor("const_378_to_fp16"), val = tensor(0x0p+0)]; tensor x_607_cast_fp16 = pad(constant_val = const_378_to_fp16, mode = x_607_mode_0, pad = x_607_pad_0, x = x_605_cast_fp16)[name = tensor("x_607_cast_fp16")]; tensor var_5423 = const()[name = tensor("op_5423"), val = tensor([1, 8, -1, 7])]; tensor x_609_cast_fp16 = reshape(shape = var_5423, x = x_607_cast_fp16)[name = tensor("x_609_cast_fp16")]; tensor var_5427_begin_0 = const()[name = tensor("op_5427_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_5427_end_0 = const()[name = tensor("op_5427_end_0"), val = tensor([1, 8, 98, 7])]; tensor var_5427_end_mask_0 = const()[name = tensor("op_5427_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_5427_cast_fp16 = slice_by_index(begin = var_5427_begin_0, end = var_5427_end_0, end_mask = var_5427_end_mask_0, x = x_609_cast_fp16)[name = tensor("op_5427_cast_fp16")]; tensor var_5428 = const()[name = tensor("op_5428"), val = tensor([1, 8, 7, 97])]; tensor matrix_bd_93_cast_fp16 = reshape(shape = var_5428, x = var_5427_cast_fp16)[name = tensor("matrix_bd_93_cast_fp16")]; tensor matrix_ac_transpose_x_0 = const()[name = tensor("matrix_ac_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_transpose_y_0 = const()[name = tensor("matrix_ac_transpose_y_0"), val = tensor(false)]; tensor transpose_142_perm_0 = const()[name = tensor("transpose_142_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_143_perm_0 = const()[name = tensor("transpose_143_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_143 = transpose(perm = transpose_143_perm_0, x = k_93_cast_fp16)[name = tensor("transpose_153")]; tensor transpose_142 = transpose(perm = transpose_142_perm_0, x = var_5411_cast_fp16)[name = tensor("transpose_154")]; tensor matrix_ac_cast_fp16 = matmul(transpose_x = matrix_ac_transpose_x_0, transpose_y = matrix_ac_transpose_y_0, x = transpose_142, y = transpose_143)[name = tensor("matrix_ac_cast_fp16")]; tensor matrix_bd_begin_0 = const()[name = tensor("matrix_bd_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_end_0 = const()[name = tensor("matrix_bd_end_0"), val = tensor([1, 8, 7, 49])]; tensor matrix_bd_end_mask_0 = const()[name = tensor("matrix_bd_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_cast_fp16 = slice_by_index(begin = matrix_bd_begin_0, end = matrix_bd_end_0, end_mask = matrix_bd_end_mask_0, x = matrix_bd_93_cast_fp16)[name = tensor("matrix_bd_cast_fp16")]; tensor var_5437_cast_fp16 = add(x = matrix_ac_cast_fp16, y = matrix_bd_cast_fp16)[name = tensor("op_5437_cast_fp16")]; tensor _inversed_scores_93_y_0_to_fp16 = const()[name = tensor("_inversed_scores_93_y_0_to_fp16"), val = tensor(0x1.6ap-4)]; tensor _inversed_scores_93_cast_fp16 = mul(x = var_5437_cast_fp16, y = _inversed_scores_93_y_0_to_fp16)[name = tensor("_inversed_scores_93_cast_fp16")]; tensor scores_cast_fp16 = select(a = var_45_to_fp16, b = _inversed_scores_93_cast_fp16, cond = mask_11)[name = tensor("scores_cast_fp16")]; tensor var_5443_cast_fp16 = softmax(axis = var_59, x = scores_cast_fp16)[name = tensor("op_5443_cast_fp16")]; tensor input_1237_cast_fp16 = select(a = var_44_to_fp16, b = var_5443_cast_fp16, cond = mask_11)[name = tensor("input_1237_cast_fp16")]; tensor x_611_transpose_x_0 = const()[name = tensor("x_611_transpose_x_0"), val = tensor(false)]; tensor x_611_transpose_y_0 = const()[name = tensor("x_611_transpose_y_0"), val = tensor(false)]; tensor value_cast_fp16 = transpose(perm = value_perm_0, x = v_cast_fp16)[name = tensor("transpose_152")]; tensor x_611_cast_fp16 = matmul(transpose_x = x_611_transpose_x_0, transpose_y = x_611_transpose_y_0, x = input_1237_cast_fp16, y = value_cast_fp16)[name = tensor("x_611_cast_fp16")]; tensor var_5447_perm_0 = const()[name = tensor("op_5447_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_5448 = const()[name = tensor("op_5448"), val = tensor([1, -1, 1024])]; tensor var_5447_cast_fp16 = transpose(perm = var_5447_perm_0, x = x_611_cast_fp16)[name = tensor("transpose_151")]; tensor input_1239_cast_fp16 = reshape(shape = var_5448, x = var_5447_cast_fp16)[name = tensor("input_1239_cast_fp16")]; tensor encoder_layers_23_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533287616)))]; tensor encoder_layers_23_self_attn_linear_out_bias_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535384832)))]; tensor linear_214_cast_fp16 = linear(bias = encoder_layers_23_self_attn_linear_out_bias_to_fp16, weight = encoder_layers_23_self_attn_linear_out_weight_to_fp16, x = input_1239_cast_fp16)[name = tensor("linear_214_cast_fp16")]; tensor input_1243_cast_fp16 = add(x = input_1233_cast_fp16, y = linear_214_cast_fp16)[name = tensor("input_1243_cast_fp16")]; tensor x_615_axes_0 = const()[name = tensor("x_615_axes_0"), val = tensor([-1])]; tensor encoder_layers_23_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_23_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535386944)))]; tensor encoder_layers_23_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_23_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535389056)))]; tensor x_615_cast_fp16 = layer_norm(axes = x_615_axes_0, beta = encoder_layers_23_norm_conv_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_23_norm_conv_weight_to_fp16, x = input_1243_cast_fp16)[name = tensor("x_615_cast_fp16")]; tensor input_1245_perm_0 = const()[name = tensor("input_1245_perm_0"), val = tensor([0, 2, 1])]; tensor input_1247_pad_type_0 = const()[name = tensor("input_1247_pad_type_0"), val = tensor("valid")]; tensor input_1247_strides_0 = const()[name = tensor("input_1247_strides_0"), val = tensor([1])]; tensor input_1247_pad_0 = const()[name = tensor("input_1247_pad_0"), val = tensor([0, 0])]; tensor input_1247_dilations_0 = const()[name = tensor("input_1247_dilations_0"), val = tensor([1])]; tensor input_1247_groups_0 = const()[name = tensor("input_1247_groups_0"), val = tensor(1)]; tensor encoder_layers_23_conv_pointwise_conv1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_23_conv_pointwise_conv1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535391168))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(537488384))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19445568)))]; tensor input_1245_cast_fp16 = transpose(perm = input_1245_perm_0, x = x_615_cast_fp16)[name = tensor("transpose_150")]; tensor input_1247_cast_fp16 = conv(dilations = input_1247_dilations_0, groups = input_1247_groups_0, pad = input_1247_pad_0, pad_type = input_1247_pad_type_0, strides = input_1247_strides_0, weight = encoder_layers_23_conv_pointwise_conv1_weight_to_fp16_quantized, x = input_1245_cast_fp16)[name = tensor("input_1247_cast_fp16")]; tensor x_617_split_num_splits_0 = const()[name = tensor("x_617_split_num_splits_0"), val = tensor(2)]; tensor x_617_split_axis_0 = const()[name = tensor("x_617_split_axis_0"), val = tensor(1)]; tensor x_617_split_cast_fp16_0, tensor x_617_split_cast_fp16_1 = split(axis = x_617_split_axis_0, num_splits = x_617_split_num_splits_0, x = input_1247_cast_fp16)[name = tensor("x_617_split_cast_fp16")]; tensor x_617_split_1_sigmoid_cast_fp16 = sigmoid(x = x_617_split_cast_fp16_1)[name = tensor("x_617_split_1_sigmoid_cast_fp16")]; tensor x_617_cast_fp16 = mul(x = x_617_split_cast_fp16_0, y = x_617_split_1_sigmoid_cast_fp16)[name = tensor("x_617_cast_fp16")]; tensor input_1249_cast_fp16 = select(a = var_44_to_fp16, b = x_617_cast_fp16, cond = var_575)[name = tensor("input_1249_cast_fp16")]; tensor new_x_interleave_0 = const()[name = tensor("new_x_interleave_0"), val = tensor(false)]; tensor new_x_cast_fp16 = concat(axis = var_59, interleave = new_x_interleave_0, values = (cache_cast_fp16, input_1249_cast_fp16))[name = tensor("new_x_cast_fp16")]; tensor cache_last_time_cur_begin_0 = const()[name = tensor("cache_last_time_cur_begin_0"), val = tensor([0, 0, 7])]; tensor cache_last_time_cur_end_0 = const()[name = tensor("cache_last_time_cur_end_0"), val = tensor([1, 1024, 15])]; tensor cache_last_time_cur_end_mask_0 = const()[name = tensor("cache_last_time_cur_end_mask_0"), val = tensor([true, true, true])]; tensor cache_last_time_cur_cast_fp16 = slice_by_index(begin = cache_last_time_cur_begin_0, end = cache_last_time_cur_end_0, end_mask = cache_last_time_cur_end_mask_0, x = new_x_cast_fp16)[name = tensor("cache_last_time_cur_cast_fp16")]; tensor x_619_pad_type_0 = const()[name = tensor("x_619_pad_type_0"), val = tensor("valid")]; tensor x_619_groups_0 = const()[name = tensor("x_619_groups_0"), val = tensor(1024)]; tensor x_619_strides_0 = const()[name = tensor("x_619_strides_0"), val = tensor([1])]; tensor x_619_pad_0 = const()[name = tensor("x_619_pad_0"), val = tensor([0, 0])]; tensor x_619_dilations_0 = const()[name = tensor("x_619_dilations_0"), val = tensor([1])]; tensor encoder_layers_23_conv_depthwise_conv_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_23_conv_depthwise_conv_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(537492544))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(537501824))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_619_cast_fp16 = conv(dilations = x_619_dilations_0, groups = x_619_groups_0, pad = x_619_pad_0, pad_type = x_619_pad_type_0, strides = x_619_strides_0, weight = encoder_layers_23_conv_depthwise_conv_weight_to_fp16_quantized, x = new_x_cast_fp16)[name = tensor("x_619_cast_fp16")]; tensor input_1251_perm_0 = const()[name = tensor("input_1251_perm_0"), val = tensor([0, 2, 1])]; tensor x_621_axes_0 = const()[name = tensor("x_621_axes_0"), val = tensor([-1])]; tensor encoder_layers_23_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_23_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(537503936)))]; tensor encoder_layers_23_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_23_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(537506048)))]; tensor input_1251_cast_fp16 = transpose(perm = input_1251_perm_0, x = x_619_cast_fp16)[name = tensor("transpose_149")]; tensor x_621_cast_fp16 = layer_norm(axes = x_621_axes_0, beta = encoder_layers_23_conv_batch_norm_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_23_conv_batch_norm_weight_to_fp16, x = input_1251_cast_fp16)[name = tensor("x_621_cast_fp16")]; tensor input_1253_perm_0 = const()[name = tensor("input_1253_perm_0"), val = tensor([0, 2, 1])]; tensor input_1253_cast_fp16 = transpose(perm = input_1253_perm_0, x = x_621_cast_fp16)[name = tensor("transpose_148")]; tensor input_1255_cast_fp16 = silu(x = input_1253_cast_fp16)[name = tensor("input_1255_cast_fp16")]; tensor x_623_pad_type_0 = const()[name = tensor("x_623_pad_type_0"), val = tensor("valid")]; tensor x_623_strides_0 = const()[name = tensor("x_623_strides_0"), val = tensor([1])]; tensor x_623_pad_0 = const()[name = tensor("x_623_pad_0"), val = tensor([0, 0])]; tensor x_623_dilations_0 = const()[name = tensor("x_623_dilations_0"), val = tensor([1])]; tensor x_623_groups_0 = const()[name = tensor("x_623_groups_0"), val = tensor(1)]; tensor encoder_layers_23_conv_pointwise_conv2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("encoder_layers_23_conv_pointwise_conv2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(537508160))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538556800))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4600960)))]; tensor x_623_cast_fp16 = conv(dilations = x_623_dilations_0, groups = x_623_groups_0, pad = x_623_pad_0, pad_type = x_623_pad_type_0, strides = x_623_strides_0, weight = encoder_layers_23_conv_pointwise_conv2_weight_to_fp16_quantized, x = input_1255_cast_fp16)[name = tensor("x_623_cast_fp16")]; tensor input_1257_perm_0 = const()[name = tensor("input_1257_perm_0"), val = tensor([0, 2, 1])]; tensor input_1257_cast_fp16 = transpose(perm = input_1257_perm_0, x = x_623_cast_fp16)[name = tensor("transpose_147")]; tensor input_1259_cast_fp16 = add(x = input_1243_cast_fp16, y = input_1257_cast_fp16)[name = tensor("input_1259_cast_fp16")]; tensor input_1261_axes_0 = const()[name = tensor("input_1261_axes_0"), val = tensor([-1])]; tensor encoder_layers_23_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_23_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538558912)))]; tensor encoder_layers_23_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_23_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538561024)))]; tensor input_1261_cast_fp16 = layer_norm(axes = input_1261_axes_0, beta = encoder_layers_23_norm_feed_forward2_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_23_norm_feed_forward2_weight_to_fp16, x = input_1259_cast_fp16)[name = tensor("input_1261_cast_fp16")]; tensor encoder_layers_23_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_23_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538563136)))]; tensor encoder_layers_23_feed_forward2_linear1_bias_to_fp16 = const()[name = tensor("encoder_layers_23_feed_forward2_linear1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(546951808)))]; tensor linear_215_cast_fp16 = linear(bias = encoder_layers_23_feed_forward2_linear1_bias_to_fp16, weight = encoder_layers_23_feed_forward2_linear1_weight_to_fp16, x = input_1261_cast_fp16)[name = tensor("linear_215_cast_fp16")]; tensor input_1265_cast_fp16 = silu(x = linear_215_cast_fp16)[name = tensor("input_1265_cast_fp16")]; tensor encoder_layers_23_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_23_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(546960064)))]; tensor encoder_layers_23_feed_forward2_linear2_bias_to_fp16 = const()[name = tensor("encoder_layers_23_feed_forward2_linear2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(555348736)))]; tensor linear_216_cast_fp16 = linear(bias = encoder_layers_23_feed_forward2_linear2_bias_to_fp16, weight = encoder_layers_23_feed_forward2_linear2_weight_to_fp16, x = input_1265_cast_fp16)[name = tensor("linear_216_cast_fp16")]; tensor var_5530_to_fp16 = const()[name = tensor("op_5530_to_fp16"), val = tensor(0x1p-1)]; tensor var_5531_cast_fp16 = mul(x = linear_216_cast_fp16, y = var_5530_to_fp16)[name = tensor("op_5531_cast_fp16")]; tensor input_1271_cast_fp16 = add(x = input_1259_cast_fp16, y = var_5531_cast_fp16)[name = tensor("input_1271_cast_fp16")]; tensor audio_signal_axes_0 = const()[name = tensor("audio_signal_axes_0"), val = tensor([-1])]; tensor encoder_layers_23_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_23_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(555350848)))]; tensor encoder_layers_23_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_23_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(555352960)))]; tensor audio_signal_cast_fp16 = layer_norm(axes = audio_signal_axes_0, beta = encoder_layers_23_norm_out_bias_to_fp16, epsilon = var_42_to_fp16, gamma = encoder_layers_23_norm_out_weight_to_fp16, x = input_1271_cast_fp16)[name = tensor("audio_signal_cast_fp16")]; tensor obj_5_axis_0 = const()[name = tensor("obj_5_axis_0"), val = tensor(0)]; tensor obj_5_cast_fp16 = stack(axis = obj_5_axis_0, values = (var_484_cast_fp16, var_697_cast_fp16, var_910_cast_fp16, var_1123_cast_fp16, var_1336_cast_fp16, var_1549_cast_fp16, var_1762_cast_fp16, var_1975_cast_fp16, var_2188_cast_fp16, var_2401_cast_fp16, var_2614_cast_fp16, var_2827_cast_fp16, var_3040_cast_fp16, var_3253_cast_fp16, var_3466_cast_fp16, var_3679_cast_fp16, var_3892_cast_fp16, var_4105_cast_fp16, var_4318_cast_fp16, var_4531_cast_fp16, var_4744_cast_fp16, var_4957_cast_fp16, var_5170_cast_fp16, cache_last_channel_cur_cast_fp16))[name = tensor("obj_5_cast_fp16")]; tensor obj_7_axis_0 = const()[name = tensor("obj_7_axis_0"), val = tensor(0)]; tensor obj_7_cast_fp16 = stack(axis = obj_7_axis_0, values = (var_588_cast_fp16, var_801_cast_fp16, var_1014_cast_fp16, var_1227_cast_fp16, var_1440_cast_fp16, var_1653_cast_fp16, var_1866_cast_fp16, var_2079_cast_fp16, var_2292_cast_fp16, var_2505_cast_fp16, var_2718_cast_fp16, var_2931_cast_fp16, var_3144_cast_fp16, var_3357_cast_fp16, var_3570_cast_fp16, var_3783_cast_fp16, var_3996_cast_fp16, var_4209_cast_fp16, var_4422_cast_fp16, var_4635_cast_fp16, var_4848_cast_fp16, var_5061_cast_fp16, var_5274_cast_fp16, cache_last_time_cur_cast_fp16))[name = tensor("obj_7_cast_fp16")]; tensor var_5547 = add(x = cache_len, y = max_audio_length_1)[name = tensor("op_5547")]; tensor var_5547_promoted_to_fp16_dtype_0 = const()[name = tensor("op_5547_promoted_to_fp16_dtype_0"), val = tensor("fp16")]; tensor const_384_to_fp16 = const()[name = tensor("const_384_to_fp16"), val = tensor(-inf)]; tensor var_49_promoted_to_fp16 = const()[name = tensor("op_49_promoted_to_fp16"), val = tensor(0x1.5p+5)]; tensor var_5547_to_fp16 = cast(dtype = var_5547_promoted_to_fp16_dtype_0, x = var_5547)[name = tensor("cast_6")]; tensor clip_1_cast_fp16 = clip(alpha = const_384_to_fp16, beta = var_49_promoted_to_fp16, x = var_5547_to_fp16)[name = tensor("clip_1_cast_fp16")]; tensor var_5584 = const()[name = tensor("op_5584"), val = tensor(0)]; tensor one_hot_1_batch_dims_0 = const()[name = tensor("one_hot_1_batch_dims_0"), val = tensor(0)]; tensor one_hot_1_validate_indices_0 = const()[name = tensor("one_hot_1_validate_indices_0"), val = tensor(false)]; tensor to_onehot_identity_table_to_fp16 = const()[name = tensor("to_onehot_identity_table_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(555355072)))]; tensor prompt_id_to_int16_dtype_0 = const()[name = tensor("prompt_id_to_int16_dtype_0"), val = tensor("int16")]; tensor prompt_id_to_int16 = cast(dtype = prompt_id_to_int16_dtype_0, x = prompt_id)[name = tensor("cast_5")]; tensor one_hot_1_cast_fp16_cast_uint16 = gather(axis = var_5584, batch_dims = one_hot_1_batch_dims_0, indices = prompt_id_to_int16, validate_indices = one_hot_1_validate_indices_0, x = to_onehot_identity_table_to_fp16)[name = tensor("one_hot_1_cast_fp16_cast_uint16")]; tensor var_5593_axes_0 = const()[name = tensor("op_5593_axes_0"), val = tensor([1])]; tensor var_5593_cast_fp16 = expand_dims(axes = var_5593_axes_0, x = one_hot_1_cast_fp16_cast_uint16)[name = tensor("op_5593_cast_fp16")]; tensor one_hot_reps_0 = const()[name = tensor("one_hot_reps_0"), val = tensor([1, 7, 1])]; tensor one_hot_cast_fp16 = tile(reps = one_hot_reps_0, x = var_5593_cast_fp16)[name = tensor("one_hot_cast_fp16")]; tensor var_5602 = const()[name = tensor("op_5602"), val = tensor(-1)]; tensor input_1273_interleave_0 = const()[name = tensor("input_1273_interleave_0"), val = tensor(false)]; tensor input_1273_cast_fp16 = concat(axis = var_5602, interleave = input_1273_interleave_0, values = (audio_signal_cast_fp16, one_hot_cast_fp16))[name = tensor("input_1273_cast_fp16")]; tensor prompt_kernel_0_weight_to_fp16 = const()[name = tensor("prompt_kernel_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(555387904)))]; tensor prompt_kernel_0_bias_to_fp16 = const()[name = tensor("prompt_kernel_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(560106560)))]; tensor linear_217_cast_fp16 = linear(bias = prompt_kernel_0_bias_to_fp16, weight = prompt_kernel_0_weight_to_fp16, x = input_1273_cast_fp16)[name = tensor("linear_217_cast_fp16")]; tensor input_cast_fp16 = relu(x = linear_217_cast_fp16)[name = tensor("input_cast_fp16")]; tensor prompt_kernel_2_weight_to_fp16 = const()[name = tensor("prompt_kernel_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(560110720)))]; tensor prompt_kernel_2_bias_to_fp16 = const()[name = tensor("prompt_kernel_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(564305088)))]; tensor linear_218_cast_fp16 = linear(bias = prompt_kernel_2_bias_to_fp16, weight = prompt_kernel_2_weight_to_fp16, x = input_cast_fp16)[name = tensor("linear_218_cast_fp16")]; tensor var_5615_perm_0 = const()[name = tensor("op_5615_perm_0"), val = tensor([0, 2, 1])]; tensor var_5615_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_5615_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor cast_246_dtype_0 = const()[name = tensor("cast_246_dtype_0"), val = tensor("int32")]; tensor var_5623_perm_0 = const()[name = tensor("op_5623_perm_0"), val = tensor([1, 0, 2, 3])]; tensor var_5623_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_5623_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor var_5626_perm_0 = const()[name = tensor("op_5626_perm_0"), val = tensor([1, 0, 2, 3])]; tensor var_5626_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_5626_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor cast_247_dtype_0 = const()[name = tensor("cast_247_dtype_0"), val = tensor("int32")]; tensor cache_len_out = cast(dtype = cast_247_dtype_0, x = clip_1_cast_fp16)[name = tensor("cast_0")]; tensor var_5626_cast_fp16 = transpose(perm = var_5626_perm_0, x = obj_7_cast_fp16)[name = tensor("transpose_144")]; tensor cache_time_out = cast(dtype = var_5626_cast_fp16_to_fp32_dtype_0, x = var_5626_cast_fp16)[name = tensor("cast_1")]; tensor var_5623_cast_fp16 = transpose(perm = var_5623_perm_0, x = obj_5_cast_fp16)[name = tensor("transpose_145")]; tensor cache_channel_out = cast(dtype = var_5623_cast_fp16_to_fp32_dtype_0, x = var_5623_cast_fp16)[name = tensor("cast_2")]; tensor encoded_length = cast(dtype = cast_246_dtype_0, x = clip_0_cast_fp16)[name = tensor("cast_3")]; tensor var_5615_cast_fp16 = transpose(perm = var_5615_perm_0, x = linear_218_cast_fp16)[name = tensor("transpose_146")]; tensor encoded = cast(dtype = var_5615_cast_fp16_to_fp32_dtype_0, x = var_5615_cast_fp16)[name = tensor("cast_4")]; } -> (encoded, encoded_length, cache_channel_out, cache_time_out, cache_len_out); }