program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3500.14.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.2.2"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "8.3.0"}})] { func main(tensor logmel_data) { tensor var_28_pad_type_0 = const()[name = tensor("op_28_pad_type_0"), val = tensor("custom")]; tensor var_28_pad_0 = const()[name = tensor("op_28_pad_0"), val = tensor([1, 1])]; tensor var_28_strides_0 = const()[name = tensor("op_28_strides_0"), val = tensor([1])]; tensor var_28_dilations_0 = const()[name = tensor("op_28_dilations_0"), val = tensor([1])]; tensor var_28_groups_0 = const()[name = tensor("op_28_groups_0"), val = tensor(1)]; tensor logmel_data_to_fp16_dtype_0 = const()[name = tensor("logmel_data_to_fp16_dtype_0"), val = tensor("fp16")]; tensor const_0_to_fp16 = const()[name = tensor("const_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor const_1_to_fp16 = const()[name = tensor("const_1_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184448)))]; tensor logmel_data_to_fp16 = cast(dtype = logmel_data_to_fp16_dtype_0, x = logmel_data)[name = tensor("cast_20")]; tensor var_28_cast_fp16 = conv(bias = const_1_to_fp16, dilations = var_28_dilations_0, groups = var_28_groups_0, pad = var_28_pad_0, pad_type = var_28_pad_type_0, strides = var_28_strides_0, weight = const_0_to_fp16, x = logmel_data_to_fp16)[name = tensor("op_28_cast_fp16")]; tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; tensor input_1_cast_fp16 = gelu(mode = input_1_mode_0, x = var_28_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor var_46_pad_type_0 = const()[name = tensor("op_46_pad_type_0"), val = tensor("custom")]; tensor var_46_pad_0 = const()[name = tensor("op_46_pad_0"), val = tensor([1, 1])]; tensor var_46_strides_0 = const()[name = tensor("op_46_strides_0"), val = tensor([2])]; tensor var_46_dilations_0 = const()[name = tensor("op_46_dilations_0"), val = tensor([1])]; tensor var_46_groups_0 = const()[name = tensor("op_46_groups_0"), val = tensor(1)]; tensor const_2_to_fp16 = const()[name = tensor("const_2_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185280)))]; tensor const_3_to_fp16 = const()[name = tensor("const_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1070080)))]; tensor var_46_cast_fp16 = conv(bias = const_3_to_fp16, dilations = var_46_dilations_0, groups = var_46_groups_0, pad = var_46_pad_0, pad_type = var_46_pad_type_0, strides = var_46_strides_0, weight = const_2_to_fp16, x = input_1_cast_fp16)[name = tensor("op_46_cast_fp16")]; tensor x_3_mode_0 = const()[name = tensor("x_3_mode_0"), val = tensor("EXACT")]; tensor x_3_cast_fp16 = gelu(mode = x_3_mode_0, x = var_46_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor var_51_to_fp16 = const()[name = tensor("op_51_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1070912)))]; tensor var_53_cast_fp16 = add(x = x_3_cast_fp16, y = var_51_to_fp16)[name = tensor("op_53_cast_fp16")]; tensor inputs_1_axes_0 = const()[name = tensor("inputs_1_axes_0"), val = tensor([2])]; tensor inputs_1_cast_fp16 = expand_dims(axes = inputs_1_axes_0, x = var_53_cast_fp16)[name = tensor("inputs_1_cast_fp16")]; tensor var_68 = const()[name = tensor("op_68"), val = tensor(1)]; tensor input_3_axes_0 = const()[name = tensor("input_3_axes_0"), val = tensor([1])]; tensor input_3_gamma_0_to_fp16 = const()[name = tensor("input_3_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2222976)))]; tensor input_3_beta_0_to_fp16 = const()[name = tensor("input_3_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2223808)))]; tensor var_84_to_fp16 = const()[name = tensor("op_84_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_3_cast_fp16 = layer_norm(axes = input_3_axes_0, beta = input_3_beta_0_to_fp16, epsilon = var_84_to_fp16, gamma = input_3_gamma_0_to_fp16, x = inputs_1_cast_fp16)[name = tensor("input_3_cast_fp16")]; tensor q_1_pad_type_0 = const()[name = tensor("q_1_pad_type_0"), val = tensor("valid")]; tensor q_1_strides_0 = const()[name = tensor("q_1_strides_0"), val = tensor([1, 1])]; tensor q_1_pad_0 = const()[name = tensor("q_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_1_dilations_0 = const()[name = tensor("q_1_dilations_0"), val = tensor([1, 1])]; tensor q_1_groups_0 = const()[name = tensor("q_1_groups_0"), val = tensor(1)]; tensor var_119_weight_0_to_fp16 = const()[name = tensor("op_119_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2224640)))]; tensor var_119_bias_0_to_fp16 = const()[name = tensor("op_119_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2519616)))]; tensor var_119_cast_fp16 = conv(bias = var_119_bias_0_to_fp16, dilations = q_1_dilations_0, groups = q_1_groups_0, pad = q_1_pad_0, pad_type = q_1_pad_type_0, strides = q_1_strides_0, weight = var_119_weight_0_to_fp16, x = input_3_cast_fp16)[name = tensor("op_119_cast_fp16")]; tensor k_1_pad_type_0 = const()[name = tensor("k_1_pad_type_0"), val = tensor("valid")]; tensor k_1_strides_0 = const()[name = tensor("k_1_strides_0"), val = tensor([1, 1])]; tensor k_1_pad_0 = const()[name = tensor("k_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_1_dilations_0 = const()[name = tensor("k_1_dilations_0"), val = tensor([1, 1])]; tensor k_1_groups_0 = const()[name = tensor("k_1_groups_0"), val = tensor(1)]; tensor blocks_0_attn_key_weight_to_fp16 = const()[name = tensor("blocks_0_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2520448)))]; tensor k_1_cast_fp16 = conv(dilations = k_1_dilations_0, groups = k_1_groups_0, pad = k_1_pad_0, pad_type = k_1_pad_type_0, strides = k_1_strides_0, weight = blocks_0_attn_key_weight_to_fp16, x = input_3_cast_fp16)[name = tensor("k_1_cast_fp16")]; tensor var_117_pad_type_0 = const()[name = tensor("op_117_pad_type_0"), val = tensor("valid")]; tensor var_117_strides_0 = const()[name = tensor("op_117_strides_0"), val = tensor([1, 1])]; tensor var_117_pad_0 = const()[name = tensor("op_117_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_117_dilations_0 = const()[name = tensor("op_117_dilations_0"), val = tensor([1, 1])]; tensor var_117_groups_0 = const()[name = tensor("op_117_groups_0"), val = tensor(1)]; tensor blocks_0_attn_value_weight_to_fp16 = const()[name = tensor("blocks_0_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2815424)))]; tensor blocks_0_attn_value_bias_to_fp16 = const()[name = tensor("blocks_0_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3110400)))]; tensor var_117_cast_fp16 = conv(bias = blocks_0_attn_value_bias_to_fp16, dilations = var_117_dilations_0, groups = var_117_groups_0, pad = var_117_pad_0, pad_type = var_117_pad_type_0, strides = var_117_strides_0, weight = blocks_0_attn_value_weight_to_fp16, x = input_3_cast_fp16)[name = tensor("op_117_cast_fp16")]; tensor tile_0 = const()[name = tensor("tile_0"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_120_axis_0 = const()[name = tensor("op_120_axis_0"), val = tensor(1)]; tensor var_120_cast_fp16_0, tensor var_120_cast_fp16_1, tensor var_120_cast_fp16_2, tensor var_120_cast_fp16_3, tensor var_120_cast_fp16_4, tensor var_120_cast_fp16_5 = split(axis = var_120_axis_0, split_sizes = tile_0, x = var_119_cast_fp16)[name = tensor("op_120_cast_fp16")]; tensor var_127_perm_0 = const()[name = tensor("op_127_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_1 = const()[name = tensor("tile_1"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_128_axis_0 = const()[name = tensor("op_128_axis_0"), val = tensor(3)]; tensor var_127_cast_fp16 = transpose(perm = var_127_perm_0, x = k_1_cast_fp16)[name = tensor("transpose_4")]; tensor var_128_cast_fp16_0, tensor var_128_cast_fp16_1, tensor var_128_cast_fp16_2, tensor var_128_cast_fp16_3, tensor var_128_cast_fp16_4, tensor var_128_cast_fp16_5 = split(axis = var_128_axis_0, split_sizes = tile_1, x = var_127_cast_fp16)[name = tensor("op_128_cast_fp16")]; tensor tile_2 = const()[name = tensor("tile_2"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_135_axis_0 = const()[name = tensor("op_135_axis_0"), val = tensor(1)]; tensor var_135_cast_fp16_0, tensor var_135_cast_fp16_1, tensor var_135_cast_fp16_2, tensor var_135_cast_fp16_3, tensor var_135_cast_fp16_4, tensor var_135_cast_fp16_5 = split(axis = var_135_axis_0, split_sizes = tile_2, x = var_117_cast_fp16)[name = tensor("op_135_cast_fp16")]; tensor aw_1_equation_0 = const()[name = tensor("aw_1_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1_cast_fp16 = einsum(equation = aw_1_equation_0, values = (var_128_cast_fp16_0, var_120_cast_fp16_0))[name = tensor("aw_1_cast_fp16")]; tensor aw_3_equation_0 = const()[name = tensor("aw_3_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_3_cast_fp16 = einsum(equation = aw_3_equation_0, values = (var_128_cast_fp16_1, var_120_cast_fp16_1))[name = tensor("aw_3_cast_fp16")]; tensor aw_5_equation_0 = const()[name = tensor("aw_5_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_5_cast_fp16 = einsum(equation = aw_5_equation_0, values = (var_128_cast_fp16_2, var_120_cast_fp16_2))[name = tensor("aw_5_cast_fp16")]; tensor aw_7_equation_0 = const()[name = tensor("aw_7_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_7_cast_fp16 = einsum(equation = aw_7_equation_0, values = (var_128_cast_fp16_3, var_120_cast_fp16_3))[name = tensor("aw_7_cast_fp16")]; tensor aw_9_equation_0 = const()[name = tensor("aw_9_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_9_cast_fp16 = einsum(equation = aw_9_equation_0, values = (var_128_cast_fp16_4, var_120_cast_fp16_4))[name = tensor("aw_9_cast_fp16")]; tensor aw_11_equation_0 = const()[name = tensor("aw_11_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_11_cast_fp16 = einsum(equation = aw_11_equation_0, values = (var_128_cast_fp16_5, var_120_cast_fp16_5))[name = tensor("aw_11_cast_fp16")]; tensor var_154_cast_fp16 = softmax(axis = var_68, x = aw_1_cast_fp16)[name = tensor("op_154_cast_fp16")]; tensor var_155_cast_fp16 = softmax(axis = var_68, x = aw_3_cast_fp16)[name = tensor("op_155_cast_fp16")]; tensor var_156_cast_fp16 = softmax(axis = var_68, x = aw_5_cast_fp16)[name = tensor("op_156_cast_fp16")]; tensor var_157_cast_fp16 = softmax(axis = var_68, x = aw_7_cast_fp16)[name = tensor("op_157_cast_fp16")]; tensor var_158_cast_fp16 = softmax(axis = var_68, x = aw_9_cast_fp16)[name = tensor("op_158_cast_fp16")]; tensor var_159_cast_fp16 = softmax(axis = var_68, x = aw_11_cast_fp16)[name = tensor("op_159_cast_fp16")]; tensor var_161_equation_0 = const()[name = tensor("op_161_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_161_cast_fp16 = einsum(equation = var_161_equation_0, values = (var_135_cast_fp16_0, var_154_cast_fp16))[name = tensor("op_161_cast_fp16")]; tensor var_163_equation_0 = const()[name = tensor("op_163_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_163_cast_fp16 = einsum(equation = var_163_equation_0, values = (var_135_cast_fp16_1, var_155_cast_fp16))[name = tensor("op_163_cast_fp16")]; tensor var_165_equation_0 = const()[name = tensor("op_165_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_165_cast_fp16 = einsum(equation = var_165_equation_0, values = (var_135_cast_fp16_2, var_156_cast_fp16))[name = tensor("op_165_cast_fp16")]; tensor var_167_equation_0 = const()[name = tensor("op_167_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_167_cast_fp16 = einsum(equation = var_167_equation_0, values = (var_135_cast_fp16_3, var_157_cast_fp16))[name = tensor("op_167_cast_fp16")]; tensor var_169_equation_0 = const()[name = tensor("op_169_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_169_cast_fp16 = einsum(equation = var_169_equation_0, values = (var_135_cast_fp16_4, var_158_cast_fp16))[name = tensor("op_169_cast_fp16")]; tensor var_171_equation_0 = const()[name = tensor("op_171_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_171_cast_fp16 = einsum(equation = var_171_equation_0, values = (var_135_cast_fp16_5, var_159_cast_fp16))[name = tensor("op_171_cast_fp16")]; tensor input_5_interleave_0 = const()[name = tensor("input_5_interleave_0"), val = tensor(false)]; tensor input_5_cast_fp16 = concat(axis = var_68, interleave = input_5_interleave_0, values = (var_161_cast_fp16, var_163_cast_fp16, var_165_cast_fp16, var_167_cast_fp16, var_169_cast_fp16, var_171_cast_fp16))[name = tensor("input_5_cast_fp16")]; tensor var_180_pad_type_0 = const()[name = tensor("op_180_pad_type_0"), val = tensor("valid")]; tensor var_180_strides_0 = const()[name = tensor("op_180_strides_0"), val = tensor([1, 1])]; tensor var_180_pad_0 = const()[name = tensor("op_180_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_180_dilations_0 = const()[name = tensor("op_180_dilations_0"), val = tensor([1, 1])]; tensor var_180_groups_0 = const()[name = tensor("op_180_groups_0"), val = tensor(1)]; tensor blocks_0_attn_out_weight_to_fp16 = const()[name = tensor("blocks_0_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3111232)))]; tensor blocks_0_attn_out_bias_to_fp16 = const()[name = tensor("blocks_0_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3406208)))]; tensor var_180_cast_fp16 = conv(bias = blocks_0_attn_out_bias_to_fp16, dilations = var_180_dilations_0, groups = var_180_groups_0, pad = var_180_pad_0, pad_type = var_180_pad_type_0, strides = var_180_strides_0, weight = blocks_0_attn_out_weight_to_fp16, x = input_5_cast_fp16)[name = tensor("op_180_cast_fp16")]; tensor inputs_3_cast_fp16 = add(x = inputs_1_cast_fp16, y = var_180_cast_fp16)[name = tensor("inputs_3_cast_fp16")]; tensor input_7_axes_0 = const()[name = tensor("input_7_axes_0"), val = tensor([1])]; tensor input_7_gamma_0_to_fp16 = const()[name = tensor("input_7_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3407040)))]; tensor input_7_beta_0_to_fp16 = const()[name = tensor("input_7_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3407872)))]; tensor var_190_to_fp16 = const()[name = tensor("op_190_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_7_cast_fp16 = layer_norm(axes = input_7_axes_0, beta = input_7_beta_0_to_fp16, epsilon = var_190_to_fp16, gamma = input_7_gamma_0_to_fp16, x = inputs_3_cast_fp16)[name = tensor("input_7_cast_fp16")]; tensor input_9_pad_type_0 = const()[name = tensor("input_9_pad_type_0"), val = tensor("valid")]; tensor input_9_strides_0 = const()[name = tensor("input_9_strides_0"), val = tensor([1, 1])]; tensor input_9_pad_0 = const()[name = tensor("input_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_9_dilations_0 = const()[name = tensor("input_9_dilations_0"), val = tensor([1, 1])]; tensor input_9_groups_0 = const()[name = tensor("input_9_groups_0"), val = tensor(1)]; tensor blocks_0_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3408704)))]; tensor blocks_0_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4588416)))]; tensor input_9_cast_fp16 = conv(bias = blocks_0_mlp_0_bias_to_fp16, dilations = input_9_dilations_0, groups = input_9_groups_0, pad = input_9_pad_0, pad_type = input_9_pad_type_0, strides = input_9_strides_0, weight = blocks_0_mlp_0_weight_to_fp16, x = input_7_cast_fp16)[name = tensor("input_9_cast_fp16")]; tensor input_11_mode_0 = const()[name = tensor("input_11_mode_0"), val = tensor("EXACT")]; tensor input_11_cast_fp16 = gelu(mode = input_11_mode_0, x = input_9_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor var_216_pad_type_0 = const()[name = tensor("op_216_pad_type_0"), val = tensor("valid")]; tensor var_216_strides_0 = const()[name = tensor("op_216_strides_0"), val = tensor([1, 1])]; tensor var_216_pad_0 = const()[name = tensor("op_216_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_216_dilations_0 = const()[name = tensor("op_216_dilations_0"), val = tensor([1, 1])]; tensor var_216_groups_0 = const()[name = tensor("op_216_groups_0"), val = tensor(1)]; tensor blocks_0_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4591552)))]; tensor blocks_0_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5771264)))]; tensor var_216_cast_fp16 = conv(bias = blocks_0_mlp_2_bias_to_fp16, dilations = var_216_dilations_0, groups = var_216_groups_0, pad = var_216_pad_0, pad_type = var_216_pad_type_0, strides = var_216_strides_0, weight = blocks_0_mlp_2_weight_to_fp16, x = input_11_cast_fp16)[name = tensor("op_216_cast_fp16")]; tensor inputs_5_cast_fp16 = add(x = inputs_3_cast_fp16, y = var_216_cast_fp16)[name = tensor("inputs_5_cast_fp16")]; tensor var_225 = const()[name = tensor("op_225"), val = tensor(1)]; tensor input_13_axes_0 = const()[name = tensor("input_13_axes_0"), val = tensor([1])]; tensor input_13_gamma_0_to_fp16 = const()[name = tensor("input_13_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5772096)))]; tensor input_13_beta_0_to_fp16 = const()[name = tensor("input_13_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5772928)))]; tensor var_241_to_fp16 = const()[name = tensor("op_241_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_13_cast_fp16 = layer_norm(axes = input_13_axes_0, beta = input_13_beta_0_to_fp16, epsilon = var_241_to_fp16, gamma = input_13_gamma_0_to_fp16, x = inputs_5_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor q_3_pad_type_0 = const()[name = tensor("q_3_pad_type_0"), val = tensor("valid")]; tensor q_3_strides_0 = const()[name = tensor("q_3_strides_0"), val = tensor([1, 1])]; tensor q_3_pad_0 = const()[name = tensor("q_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_3_dilations_0 = const()[name = tensor("q_3_dilations_0"), val = tensor([1, 1])]; tensor q_3_groups_0 = const()[name = tensor("q_3_groups_0"), val = tensor(1)]; tensor var_276_weight_0_to_fp16 = const()[name = tensor("op_276_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5773760)))]; tensor var_276_bias_0_to_fp16 = const()[name = tensor("op_276_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6068736)))]; tensor var_276_cast_fp16 = conv(bias = var_276_bias_0_to_fp16, dilations = q_3_dilations_0, groups = q_3_groups_0, pad = q_3_pad_0, pad_type = q_3_pad_type_0, strides = q_3_strides_0, weight = var_276_weight_0_to_fp16, x = input_13_cast_fp16)[name = tensor("op_276_cast_fp16")]; tensor k_3_pad_type_0 = const()[name = tensor("k_3_pad_type_0"), val = tensor("valid")]; tensor k_3_strides_0 = const()[name = tensor("k_3_strides_0"), val = tensor([1, 1])]; tensor k_3_pad_0 = const()[name = tensor("k_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_3_dilations_0 = const()[name = tensor("k_3_dilations_0"), val = tensor([1, 1])]; tensor k_3_groups_0 = const()[name = tensor("k_3_groups_0"), val = tensor(1)]; tensor blocks_1_attn_key_weight_to_fp16 = const()[name = tensor("blocks_1_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6069568)))]; tensor k_3_cast_fp16 = conv(dilations = k_3_dilations_0, groups = k_3_groups_0, pad = k_3_pad_0, pad_type = k_3_pad_type_0, strides = k_3_strides_0, weight = blocks_1_attn_key_weight_to_fp16, x = input_13_cast_fp16)[name = tensor("k_3_cast_fp16")]; tensor var_274_pad_type_0 = const()[name = tensor("op_274_pad_type_0"), val = tensor("valid")]; tensor var_274_strides_0 = const()[name = tensor("op_274_strides_0"), val = tensor([1, 1])]; tensor var_274_pad_0 = const()[name = tensor("op_274_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_274_dilations_0 = const()[name = tensor("op_274_dilations_0"), val = tensor([1, 1])]; tensor var_274_groups_0 = const()[name = tensor("op_274_groups_0"), val = tensor(1)]; tensor blocks_1_attn_value_weight_to_fp16 = const()[name = tensor("blocks_1_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6364544)))]; tensor blocks_1_attn_value_bias_to_fp16 = const()[name = tensor("blocks_1_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6659520)))]; tensor var_274_cast_fp16 = conv(bias = blocks_1_attn_value_bias_to_fp16, dilations = var_274_dilations_0, groups = var_274_groups_0, pad = var_274_pad_0, pad_type = var_274_pad_type_0, strides = var_274_strides_0, weight = blocks_1_attn_value_weight_to_fp16, x = input_13_cast_fp16)[name = tensor("op_274_cast_fp16")]; tensor tile_3 = const()[name = tensor("tile_3"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_277_axis_0 = const()[name = tensor("op_277_axis_0"), val = tensor(1)]; tensor var_277_cast_fp16_0, tensor var_277_cast_fp16_1, tensor var_277_cast_fp16_2, tensor var_277_cast_fp16_3, tensor var_277_cast_fp16_4, tensor var_277_cast_fp16_5 = split(axis = var_277_axis_0, split_sizes = tile_3, x = var_276_cast_fp16)[name = tensor("op_277_cast_fp16")]; tensor var_284_perm_0 = const()[name = tensor("op_284_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_4 = const()[name = tensor("tile_4"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_285_axis_0 = const()[name = tensor("op_285_axis_0"), val = tensor(3)]; tensor var_284_cast_fp16 = transpose(perm = var_284_perm_0, x = k_3_cast_fp16)[name = tensor("transpose_3")]; tensor var_285_cast_fp16_0, tensor var_285_cast_fp16_1, tensor var_285_cast_fp16_2, tensor var_285_cast_fp16_3, tensor var_285_cast_fp16_4, tensor var_285_cast_fp16_5 = split(axis = var_285_axis_0, split_sizes = tile_4, x = var_284_cast_fp16)[name = tensor("op_285_cast_fp16")]; tensor tile_5 = const()[name = tensor("tile_5"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_292_axis_0 = const()[name = tensor("op_292_axis_0"), val = tensor(1)]; tensor var_292_cast_fp16_0, tensor var_292_cast_fp16_1, tensor var_292_cast_fp16_2, tensor var_292_cast_fp16_3, tensor var_292_cast_fp16_4, tensor var_292_cast_fp16_5 = split(axis = var_292_axis_0, split_sizes = tile_5, x = var_274_cast_fp16)[name = tensor("op_292_cast_fp16")]; tensor aw_13_equation_0 = const()[name = tensor("aw_13_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_13_cast_fp16 = einsum(equation = aw_13_equation_0, values = (var_285_cast_fp16_0, var_277_cast_fp16_0))[name = tensor("aw_13_cast_fp16")]; tensor aw_15_equation_0 = const()[name = tensor("aw_15_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_15_cast_fp16 = einsum(equation = aw_15_equation_0, values = (var_285_cast_fp16_1, var_277_cast_fp16_1))[name = tensor("aw_15_cast_fp16")]; tensor aw_17_equation_0 = const()[name = tensor("aw_17_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_17_cast_fp16 = einsum(equation = aw_17_equation_0, values = (var_285_cast_fp16_2, var_277_cast_fp16_2))[name = tensor("aw_17_cast_fp16")]; tensor aw_19_equation_0 = const()[name = tensor("aw_19_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_19_cast_fp16 = einsum(equation = aw_19_equation_0, values = (var_285_cast_fp16_3, var_277_cast_fp16_3))[name = tensor("aw_19_cast_fp16")]; tensor aw_21_equation_0 = const()[name = tensor("aw_21_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_21_cast_fp16 = einsum(equation = aw_21_equation_0, values = (var_285_cast_fp16_4, var_277_cast_fp16_4))[name = tensor("aw_21_cast_fp16")]; tensor aw_23_equation_0 = const()[name = tensor("aw_23_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_23_cast_fp16 = einsum(equation = aw_23_equation_0, values = (var_285_cast_fp16_5, var_277_cast_fp16_5))[name = tensor("aw_23_cast_fp16")]; tensor var_311_cast_fp16 = softmax(axis = var_225, x = aw_13_cast_fp16)[name = tensor("op_311_cast_fp16")]; tensor var_312_cast_fp16 = softmax(axis = var_225, x = aw_15_cast_fp16)[name = tensor("op_312_cast_fp16")]; tensor var_313_cast_fp16 = softmax(axis = var_225, x = aw_17_cast_fp16)[name = tensor("op_313_cast_fp16")]; tensor var_314_cast_fp16 = softmax(axis = var_225, x = aw_19_cast_fp16)[name = tensor("op_314_cast_fp16")]; tensor var_315_cast_fp16 = softmax(axis = var_225, x = aw_21_cast_fp16)[name = tensor("op_315_cast_fp16")]; tensor var_316_cast_fp16 = softmax(axis = var_225, x = aw_23_cast_fp16)[name = tensor("op_316_cast_fp16")]; tensor var_318_equation_0 = const()[name = tensor("op_318_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_318_cast_fp16 = einsum(equation = var_318_equation_0, values = (var_292_cast_fp16_0, var_311_cast_fp16))[name = tensor("op_318_cast_fp16")]; tensor var_320_equation_0 = const()[name = tensor("op_320_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_320_cast_fp16 = einsum(equation = var_320_equation_0, values = (var_292_cast_fp16_1, var_312_cast_fp16))[name = tensor("op_320_cast_fp16")]; tensor var_322_equation_0 = const()[name = tensor("op_322_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_322_cast_fp16 = einsum(equation = var_322_equation_0, values = (var_292_cast_fp16_2, var_313_cast_fp16))[name = tensor("op_322_cast_fp16")]; tensor var_324_equation_0 = const()[name = tensor("op_324_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_324_cast_fp16 = einsum(equation = var_324_equation_0, values = (var_292_cast_fp16_3, var_314_cast_fp16))[name = tensor("op_324_cast_fp16")]; tensor var_326_equation_0 = const()[name = tensor("op_326_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_326_cast_fp16 = einsum(equation = var_326_equation_0, values = (var_292_cast_fp16_4, var_315_cast_fp16))[name = tensor("op_326_cast_fp16")]; tensor var_328_equation_0 = const()[name = tensor("op_328_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_328_cast_fp16 = einsum(equation = var_328_equation_0, values = (var_292_cast_fp16_5, var_316_cast_fp16))[name = tensor("op_328_cast_fp16")]; tensor input_15_interleave_0 = const()[name = tensor("input_15_interleave_0"), val = tensor(false)]; tensor input_15_cast_fp16 = concat(axis = var_225, interleave = input_15_interleave_0, values = (var_318_cast_fp16, var_320_cast_fp16, var_322_cast_fp16, var_324_cast_fp16, var_326_cast_fp16, var_328_cast_fp16))[name = tensor("input_15_cast_fp16")]; tensor var_337_pad_type_0 = const()[name = tensor("op_337_pad_type_0"), val = tensor("valid")]; tensor var_337_strides_0 = const()[name = tensor("op_337_strides_0"), val = tensor([1, 1])]; tensor var_337_pad_0 = const()[name = tensor("op_337_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_337_dilations_0 = const()[name = tensor("op_337_dilations_0"), val = tensor([1, 1])]; tensor var_337_groups_0 = const()[name = tensor("op_337_groups_0"), val = tensor(1)]; tensor blocks_1_attn_out_weight_to_fp16 = const()[name = tensor("blocks_1_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6660352)))]; tensor blocks_1_attn_out_bias_to_fp16 = const()[name = tensor("blocks_1_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6955328)))]; tensor var_337_cast_fp16 = conv(bias = blocks_1_attn_out_bias_to_fp16, dilations = var_337_dilations_0, groups = var_337_groups_0, pad = var_337_pad_0, pad_type = var_337_pad_type_0, strides = var_337_strides_0, weight = blocks_1_attn_out_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("op_337_cast_fp16")]; tensor inputs_7_cast_fp16 = add(x = inputs_5_cast_fp16, y = var_337_cast_fp16)[name = tensor("inputs_7_cast_fp16")]; tensor input_17_axes_0 = const()[name = tensor("input_17_axes_0"), val = tensor([1])]; tensor input_17_gamma_0_to_fp16 = const()[name = tensor("input_17_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6956160)))]; tensor input_17_beta_0_to_fp16 = const()[name = tensor("input_17_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6956992)))]; tensor var_347_to_fp16 = const()[name = tensor("op_347_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_17_cast_fp16 = layer_norm(axes = input_17_axes_0, beta = input_17_beta_0_to_fp16, epsilon = var_347_to_fp16, gamma = input_17_gamma_0_to_fp16, x = inputs_7_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor input_19_pad_type_0 = const()[name = tensor("input_19_pad_type_0"), val = tensor("valid")]; tensor input_19_strides_0 = const()[name = tensor("input_19_strides_0"), val = tensor([1, 1])]; tensor input_19_pad_0 = const()[name = tensor("input_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_19_dilations_0 = const()[name = tensor("input_19_dilations_0"), val = tensor([1, 1])]; tensor input_19_groups_0 = const()[name = tensor("input_19_groups_0"), val = tensor(1)]; tensor blocks_1_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6957824)))]; tensor blocks_1_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8137536)))]; tensor input_19_cast_fp16 = conv(bias = blocks_1_mlp_0_bias_to_fp16, dilations = input_19_dilations_0, groups = input_19_groups_0, pad = input_19_pad_0, pad_type = input_19_pad_type_0, strides = input_19_strides_0, weight = blocks_1_mlp_0_weight_to_fp16, x = input_17_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor input_21_mode_0 = const()[name = tensor("input_21_mode_0"), val = tensor("EXACT")]; tensor input_21_cast_fp16 = gelu(mode = input_21_mode_0, x = input_19_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor var_373_pad_type_0 = const()[name = tensor("op_373_pad_type_0"), val = tensor("valid")]; tensor var_373_strides_0 = const()[name = tensor("op_373_strides_0"), val = tensor([1, 1])]; tensor var_373_pad_0 = const()[name = tensor("op_373_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_373_dilations_0 = const()[name = tensor("op_373_dilations_0"), val = tensor([1, 1])]; tensor var_373_groups_0 = const()[name = tensor("op_373_groups_0"), val = tensor(1)]; tensor blocks_1_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8140672)))]; tensor blocks_1_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9320384)))]; tensor var_373_cast_fp16 = conv(bias = blocks_1_mlp_2_bias_to_fp16, dilations = var_373_dilations_0, groups = var_373_groups_0, pad = var_373_pad_0, pad_type = var_373_pad_type_0, strides = var_373_strides_0, weight = blocks_1_mlp_2_weight_to_fp16, x = input_21_cast_fp16)[name = tensor("op_373_cast_fp16")]; tensor inputs_9_cast_fp16 = add(x = inputs_7_cast_fp16, y = var_373_cast_fp16)[name = tensor("inputs_9_cast_fp16")]; tensor var_382 = const()[name = tensor("op_382"), val = tensor(1)]; tensor input_23_axes_0 = const()[name = tensor("input_23_axes_0"), val = tensor([1])]; tensor input_23_gamma_0_to_fp16 = const()[name = tensor("input_23_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9321216)))]; tensor input_23_beta_0_to_fp16 = const()[name = tensor("input_23_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9322048)))]; tensor var_398_to_fp16 = const()[name = tensor("op_398_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_23_cast_fp16 = layer_norm(axes = input_23_axes_0, beta = input_23_beta_0_to_fp16, epsilon = var_398_to_fp16, gamma = input_23_gamma_0_to_fp16, x = inputs_9_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor q_5_pad_type_0 = const()[name = tensor("q_5_pad_type_0"), val = tensor("valid")]; tensor q_5_strides_0 = const()[name = tensor("q_5_strides_0"), val = tensor([1, 1])]; tensor q_5_pad_0 = const()[name = tensor("q_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_5_dilations_0 = const()[name = tensor("q_5_dilations_0"), val = tensor([1, 1])]; tensor q_5_groups_0 = const()[name = tensor("q_5_groups_0"), val = tensor(1)]; tensor var_433_weight_0_to_fp16 = const()[name = tensor("op_433_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9322880)))]; tensor var_433_bias_0_to_fp16 = const()[name = tensor("op_433_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9617856)))]; tensor var_433_cast_fp16 = conv(bias = var_433_bias_0_to_fp16, dilations = q_5_dilations_0, groups = q_5_groups_0, pad = q_5_pad_0, pad_type = q_5_pad_type_0, strides = q_5_strides_0, weight = var_433_weight_0_to_fp16, x = input_23_cast_fp16)[name = tensor("op_433_cast_fp16")]; tensor k_5_pad_type_0 = const()[name = tensor("k_5_pad_type_0"), val = tensor("valid")]; tensor k_5_strides_0 = const()[name = tensor("k_5_strides_0"), val = tensor([1, 1])]; tensor k_5_pad_0 = const()[name = tensor("k_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_5_dilations_0 = const()[name = tensor("k_5_dilations_0"), val = tensor([1, 1])]; tensor k_5_groups_0 = const()[name = tensor("k_5_groups_0"), val = tensor(1)]; tensor blocks_2_attn_key_weight_to_fp16 = const()[name = tensor("blocks_2_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9618688)))]; tensor k_5_cast_fp16 = conv(dilations = k_5_dilations_0, groups = k_5_groups_0, pad = k_5_pad_0, pad_type = k_5_pad_type_0, strides = k_5_strides_0, weight = blocks_2_attn_key_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("k_5_cast_fp16")]; tensor var_431_pad_type_0 = const()[name = tensor("op_431_pad_type_0"), val = tensor("valid")]; tensor var_431_strides_0 = const()[name = tensor("op_431_strides_0"), val = tensor([1, 1])]; tensor var_431_pad_0 = const()[name = tensor("op_431_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_431_dilations_0 = const()[name = tensor("op_431_dilations_0"), val = tensor([1, 1])]; tensor var_431_groups_0 = const()[name = tensor("op_431_groups_0"), val = tensor(1)]; tensor blocks_2_attn_value_weight_to_fp16 = const()[name = tensor("blocks_2_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9913664)))]; tensor blocks_2_attn_value_bias_to_fp16 = const()[name = tensor("blocks_2_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10208640)))]; tensor var_431_cast_fp16 = conv(bias = blocks_2_attn_value_bias_to_fp16, dilations = var_431_dilations_0, groups = var_431_groups_0, pad = var_431_pad_0, pad_type = var_431_pad_type_0, strides = var_431_strides_0, weight = blocks_2_attn_value_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("op_431_cast_fp16")]; tensor tile_6 = const()[name = tensor("tile_6"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_434_axis_0 = const()[name = tensor("op_434_axis_0"), val = tensor(1)]; tensor var_434_cast_fp16_0, tensor var_434_cast_fp16_1, tensor var_434_cast_fp16_2, tensor var_434_cast_fp16_3, tensor var_434_cast_fp16_4, tensor var_434_cast_fp16_5 = split(axis = var_434_axis_0, split_sizes = tile_6, x = var_433_cast_fp16)[name = tensor("op_434_cast_fp16")]; tensor var_441_perm_0 = const()[name = tensor("op_441_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_7 = const()[name = tensor("tile_7"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_442_axis_0 = const()[name = tensor("op_442_axis_0"), val = tensor(3)]; tensor var_441_cast_fp16 = transpose(perm = var_441_perm_0, x = k_5_cast_fp16)[name = tensor("transpose_2")]; tensor var_442_cast_fp16_0, tensor var_442_cast_fp16_1, tensor var_442_cast_fp16_2, tensor var_442_cast_fp16_3, tensor var_442_cast_fp16_4, tensor var_442_cast_fp16_5 = split(axis = var_442_axis_0, split_sizes = tile_7, x = var_441_cast_fp16)[name = tensor("op_442_cast_fp16")]; tensor tile_8 = const()[name = tensor("tile_8"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_449_axis_0 = const()[name = tensor("op_449_axis_0"), val = tensor(1)]; tensor var_449_cast_fp16_0, tensor var_449_cast_fp16_1, tensor var_449_cast_fp16_2, tensor var_449_cast_fp16_3, tensor var_449_cast_fp16_4, tensor var_449_cast_fp16_5 = split(axis = var_449_axis_0, split_sizes = tile_8, x = var_431_cast_fp16)[name = tensor("op_449_cast_fp16")]; tensor aw_25_equation_0 = const()[name = tensor("aw_25_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_25_cast_fp16 = einsum(equation = aw_25_equation_0, values = (var_442_cast_fp16_0, var_434_cast_fp16_0))[name = tensor("aw_25_cast_fp16")]; tensor aw_27_equation_0 = const()[name = tensor("aw_27_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_27_cast_fp16 = einsum(equation = aw_27_equation_0, values = (var_442_cast_fp16_1, var_434_cast_fp16_1))[name = tensor("aw_27_cast_fp16")]; tensor aw_29_equation_0 = const()[name = tensor("aw_29_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_29_cast_fp16 = einsum(equation = aw_29_equation_0, values = (var_442_cast_fp16_2, var_434_cast_fp16_2))[name = tensor("aw_29_cast_fp16")]; tensor aw_31_equation_0 = const()[name = tensor("aw_31_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_31_cast_fp16 = einsum(equation = aw_31_equation_0, values = (var_442_cast_fp16_3, var_434_cast_fp16_3))[name = tensor("aw_31_cast_fp16")]; tensor aw_33_equation_0 = const()[name = tensor("aw_33_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_33_cast_fp16 = einsum(equation = aw_33_equation_0, values = (var_442_cast_fp16_4, var_434_cast_fp16_4))[name = tensor("aw_33_cast_fp16")]; tensor aw_35_equation_0 = const()[name = tensor("aw_35_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_35_cast_fp16 = einsum(equation = aw_35_equation_0, values = (var_442_cast_fp16_5, var_434_cast_fp16_5))[name = tensor("aw_35_cast_fp16")]; tensor var_468_cast_fp16 = softmax(axis = var_382, x = aw_25_cast_fp16)[name = tensor("op_468_cast_fp16")]; tensor var_469_cast_fp16 = softmax(axis = var_382, x = aw_27_cast_fp16)[name = tensor("op_469_cast_fp16")]; tensor var_470_cast_fp16 = softmax(axis = var_382, x = aw_29_cast_fp16)[name = tensor("op_470_cast_fp16")]; tensor var_471_cast_fp16 = softmax(axis = var_382, x = aw_31_cast_fp16)[name = tensor("op_471_cast_fp16")]; tensor var_472_cast_fp16 = softmax(axis = var_382, x = aw_33_cast_fp16)[name = tensor("op_472_cast_fp16")]; tensor var_473_cast_fp16 = softmax(axis = var_382, x = aw_35_cast_fp16)[name = tensor("op_473_cast_fp16")]; tensor var_475_equation_0 = const()[name = tensor("op_475_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_475_cast_fp16 = einsum(equation = var_475_equation_0, values = (var_449_cast_fp16_0, var_468_cast_fp16))[name = tensor("op_475_cast_fp16")]; tensor var_477_equation_0 = const()[name = tensor("op_477_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_477_cast_fp16 = einsum(equation = var_477_equation_0, values = (var_449_cast_fp16_1, var_469_cast_fp16))[name = tensor("op_477_cast_fp16")]; tensor var_479_equation_0 = const()[name = tensor("op_479_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_479_cast_fp16 = einsum(equation = var_479_equation_0, values = (var_449_cast_fp16_2, var_470_cast_fp16))[name = tensor("op_479_cast_fp16")]; tensor var_481_equation_0 = const()[name = tensor("op_481_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_481_cast_fp16 = einsum(equation = var_481_equation_0, values = (var_449_cast_fp16_3, var_471_cast_fp16))[name = tensor("op_481_cast_fp16")]; tensor var_483_equation_0 = const()[name = tensor("op_483_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_483_cast_fp16 = einsum(equation = var_483_equation_0, values = (var_449_cast_fp16_4, var_472_cast_fp16))[name = tensor("op_483_cast_fp16")]; tensor var_485_equation_0 = const()[name = tensor("op_485_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_485_cast_fp16 = einsum(equation = var_485_equation_0, values = (var_449_cast_fp16_5, var_473_cast_fp16))[name = tensor("op_485_cast_fp16")]; tensor input_25_interleave_0 = const()[name = tensor("input_25_interleave_0"), val = tensor(false)]; tensor input_25_cast_fp16 = concat(axis = var_382, interleave = input_25_interleave_0, values = (var_475_cast_fp16, var_477_cast_fp16, var_479_cast_fp16, var_481_cast_fp16, var_483_cast_fp16, var_485_cast_fp16))[name = tensor("input_25_cast_fp16")]; tensor var_494_pad_type_0 = const()[name = tensor("op_494_pad_type_0"), val = tensor("valid")]; tensor var_494_strides_0 = const()[name = tensor("op_494_strides_0"), val = tensor([1, 1])]; tensor var_494_pad_0 = const()[name = tensor("op_494_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_494_dilations_0 = const()[name = tensor("op_494_dilations_0"), val = tensor([1, 1])]; tensor var_494_groups_0 = const()[name = tensor("op_494_groups_0"), val = tensor(1)]; tensor blocks_2_attn_out_weight_to_fp16 = const()[name = tensor("blocks_2_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10209472)))]; tensor blocks_2_attn_out_bias_to_fp16 = const()[name = tensor("blocks_2_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10504448)))]; tensor var_494_cast_fp16 = conv(bias = blocks_2_attn_out_bias_to_fp16, dilations = var_494_dilations_0, groups = var_494_groups_0, pad = var_494_pad_0, pad_type = var_494_pad_type_0, strides = var_494_strides_0, weight = blocks_2_attn_out_weight_to_fp16, x = input_25_cast_fp16)[name = tensor("op_494_cast_fp16")]; tensor inputs_11_cast_fp16 = add(x = inputs_9_cast_fp16, y = var_494_cast_fp16)[name = tensor("inputs_11_cast_fp16")]; tensor input_27_axes_0 = const()[name = tensor("input_27_axes_0"), val = tensor([1])]; tensor input_27_gamma_0_to_fp16 = const()[name = tensor("input_27_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10505280)))]; tensor input_27_beta_0_to_fp16 = const()[name = tensor("input_27_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10506112)))]; tensor var_504_to_fp16 = const()[name = tensor("op_504_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_27_cast_fp16 = layer_norm(axes = input_27_axes_0, beta = input_27_beta_0_to_fp16, epsilon = var_504_to_fp16, gamma = input_27_gamma_0_to_fp16, x = inputs_11_cast_fp16)[name = tensor("input_27_cast_fp16")]; tensor input_29_pad_type_0 = const()[name = tensor("input_29_pad_type_0"), val = tensor("valid")]; tensor input_29_strides_0 = const()[name = tensor("input_29_strides_0"), val = tensor([1, 1])]; tensor input_29_pad_0 = const()[name = tensor("input_29_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_29_dilations_0 = const()[name = tensor("input_29_dilations_0"), val = tensor([1, 1])]; tensor input_29_groups_0 = const()[name = tensor("input_29_groups_0"), val = tensor(1)]; tensor blocks_2_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10506944)))]; tensor blocks_2_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11686656)))]; tensor input_29_cast_fp16 = conv(bias = blocks_2_mlp_0_bias_to_fp16, dilations = input_29_dilations_0, groups = input_29_groups_0, pad = input_29_pad_0, pad_type = input_29_pad_type_0, strides = input_29_strides_0, weight = blocks_2_mlp_0_weight_to_fp16, x = input_27_cast_fp16)[name = tensor("input_29_cast_fp16")]; tensor input_31_mode_0 = const()[name = tensor("input_31_mode_0"), val = tensor("EXACT")]; tensor input_31_cast_fp16 = gelu(mode = input_31_mode_0, x = input_29_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor var_530_pad_type_0 = const()[name = tensor("op_530_pad_type_0"), val = tensor("valid")]; tensor var_530_strides_0 = const()[name = tensor("op_530_strides_0"), val = tensor([1, 1])]; tensor var_530_pad_0 = const()[name = tensor("op_530_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_530_dilations_0 = const()[name = tensor("op_530_dilations_0"), val = tensor([1, 1])]; tensor var_530_groups_0 = const()[name = tensor("op_530_groups_0"), val = tensor(1)]; tensor blocks_2_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11689792)))]; tensor blocks_2_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12869504)))]; tensor var_530_cast_fp16 = conv(bias = blocks_2_mlp_2_bias_to_fp16, dilations = var_530_dilations_0, groups = var_530_groups_0, pad = var_530_pad_0, pad_type = var_530_pad_type_0, strides = var_530_strides_0, weight = blocks_2_mlp_2_weight_to_fp16, x = input_31_cast_fp16)[name = tensor("op_530_cast_fp16")]; tensor inputs_13_cast_fp16 = add(x = inputs_11_cast_fp16, y = var_530_cast_fp16)[name = tensor("inputs_13_cast_fp16")]; tensor var_539 = const()[name = tensor("op_539"), val = tensor(1)]; tensor input_33_axes_0 = const()[name = tensor("input_33_axes_0"), val = tensor([1])]; tensor input_33_gamma_0_to_fp16 = const()[name = tensor("input_33_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12870336)))]; tensor input_33_beta_0_to_fp16 = const()[name = tensor("input_33_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12871168)))]; tensor var_555_to_fp16 = const()[name = tensor("op_555_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_33_cast_fp16 = layer_norm(axes = input_33_axes_0, beta = input_33_beta_0_to_fp16, epsilon = var_555_to_fp16, gamma = input_33_gamma_0_to_fp16, x = inputs_13_cast_fp16)[name = tensor("input_33_cast_fp16")]; tensor q_pad_type_0 = const()[name = tensor("q_pad_type_0"), val = tensor("valid")]; tensor q_strides_0 = const()[name = tensor("q_strides_0"), val = tensor([1, 1])]; tensor q_pad_0 = const()[name = tensor("q_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_dilations_0 = const()[name = tensor("q_dilations_0"), val = tensor([1, 1])]; tensor q_groups_0 = const()[name = tensor("q_groups_0"), val = tensor(1)]; tensor var_590_weight_0_to_fp16 = const()[name = tensor("op_590_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12872000)))]; tensor var_590_bias_0_to_fp16 = const()[name = tensor("op_590_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13166976)))]; tensor var_590_cast_fp16 = conv(bias = var_590_bias_0_to_fp16, dilations = q_dilations_0, groups = q_groups_0, pad = q_pad_0, pad_type = q_pad_type_0, strides = q_strides_0, weight = var_590_weight_0_to_fp16, x = input_33_cast_fp16)[name = tensor("op_590_cast_fp16")]; tensor k_pad_type_0 = const()[name = tensor("k_pad_type_0"), val = tensor("valid")]; tensor k_strides_0 = const()[name = tensor("k_strides_0"), val = tensor([1, 1])]; tensor k_pad_0 = const()[name = tensor("k_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_dilations_0 = const()[name = tensor("k_dilations_0"), val = tensor([1, 1])]; tensor k_groups_0 = const()[name = tensor("k_groups_0"), val = tensor(1)]; tensor blocks_3_attn_key_weight_to_fp16 = const()[name = tensor("blocks_3_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13167808)))]; tensor k_cast_fp16 = conv(dilations = k_dilations_0, groups = k_groups_0, pad = k_pad_0, pad_type = k_pad_type_0, strides = k_strides_0, weight = blocks_3_attn_key_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("k_cast_fp16")]; tensor var_588_pad_type_0 = const()[name = tensor("op_588_pad_type_0"), val = tensor("valid")]; tensor var_588_strides_0 = const()[name = tensor("op_588_strides_0"), val = tensor([1, 1])]; tensor var_588_pad_0 = const()[name = tensor("op_588_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_588_dilations_0 = const()[name = tensor("op_588_dilations_0"), val = tensor([1, 1])]; tensor var_588_groups_0 = const()[name = tensor("op_588_groups_0"), val = tensor(1)]; tensor blocks_3_attn_value_weight_to_fp16 = const()[name = tensor("blocks_3_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13462784)))]; tensor blocks_3_attn_value_bias_to_fp16 = const()[name = tensor("blocks_3_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13757760)))]; tensor var_588_cast_fp16 = conv(bias = blocks_3_attn_value_bias_to_fp16, dilations = var_588_dilations_0, groups = var_588_groups_0, pad = var_588_pad_0, pad_type = var_588_pad_type_0, strides = var_588_strides_0, weight = blocks_3_attn_value_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("op_588_cast_fp16")]; tensor tile_9 = const()[name = tensor("tile_9"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_591_axis_0 = const()[name = tensor("op_591_axis_0"), val = tensor(1)]; tensor var_591_cast_fp16_0, tensor var_591_cast_fp16_1, tensor var_591_cast_fp16_2, tensor var_591_cast_fp16_3, tensor var_591_cast_fp16_4, tensor var_591_cast_fp16_5 = split(axis = var_591_axis_0, split_sizes = tile_9, x = var_590_cast_fp16)[name = tensor("op_591_cast_fp16")]; tensor var_598_perm_0 = const()[name = tensor("op_598_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_10 = const()[name = tensor("tile_10"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_599_axis_0 = const()[name = tensor("op_599_axis_0"), val = tensor(3)]; tensor var_598_cast_fp16 = transpose(perm = var_598_perm_0, x = k_cast_fp16)[name = tensor("transpose_1")]; tensor var_599_cast_fp16_0, tensor var_599_cast_fp16_1, tensor var_599_cast_fp16_2, tensor var_599_cast_fp16_3, tensor var_599_cast_fp16_4, tensor var_599_cast_fp16_5 = split(axis = var_599_axis_0, split_sizes = tile_10, x = var_598_cast_fp16)[name = tensor("op_599_cast_fp16")]; tensor tile_11 = const()[name = tensor("tile_11"), val = tensor([64, 64, 64, 64, 64, 64])]; tensor var_606_axis_0 = const()[name = tensor("op_606_axis_0"), val = tensor(1)]; tensor var_606_cast_fp16_0, tensor var_606_cast_fp16_1, tensor var_606_cast_fp16_2, tensor var_606_cast_fp16_3, tensor var_606_cast_fp16_4, tensor var_606_cast_fp16_5 = split(axis = var_606_axis_0, split_sizes = tile_11, x = var_588_cast_fp16)[name = tensor("op_606_cast_fp16")]; tensor aw_37_equation_0 = const()[name = tensor("aw_37_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_37_cast_fp16 = einsum(equation = aw_37_equation_0, values = (var_599_cast_fp16_0, var_591_cast_fp16_0))[name = tensor("aw_37_cast_fp16")]; tensor aw_39_equation_0 = const()[name = tensor("aw_39_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_39_cast_fp16 = einsum(equation = aw_39_equation_0, values = (var_599_cast_fp16_1, var_591_cast_fp16_1))[name = tensor("aw_39_cast_fp16")]; tensor aw_41_equation_0 = const()[name = tensor("aw_41_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_41_cast_fp16 = einsum(equation = aw_41_equation_0, values = (var_599_cast_fp16_2, var_591_cast_fp16_2))[name = tensor("aw_41_cast_fp16")]; tensor aw_43_equation_0 = const()[name = tensor("aw_43_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_43_cast_fp16 = einsum(equation = aw_43_equation_0, values = (var_599_cast_fp16_3, var_591_cast_fp16_3))[name = tensor("aw_43_cast_fp16")]; tensor aw_45_equation_0 = const()[name = tensor("aw_45_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_45_cast_fp16 = einsum(equation = aw_45_equation_0, values = (var_599_cast_fp16_4, var_591_cast_fp16_4))[name = tensor("aw_45_cast_fp16")]; tensor aw_equation_0 = const()[name = tensor("aw_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_cast_fp16 = einsum(equation = aw_equation_0, values = (var_599_cast_fp16_5, var_591_cast_fp16_5))[name = tensor("aw_cast_fp16")]; tensor var_625_cast_fp16 = softmax(axis = var_539, x = aw_37_cast_fp16)[name = tensor("op_625_cast_fp16")]; tensor var_626_cast_fp16 = softmax(axis = var_539, x = aw_39_cast_fp16)[name = tensor("op_626_cast_fp16")]; tensor var_627_cast_fp16 = softmax(axis = var_539, x = aw_41_cast_fp16)[name = tensor("op_627_cast_fp16")]; tensor var_628_cast_fp16 = softmax(axis = var_539, x = aw_43_cast_fp16)[name = tensor("op_628_cast_fp16")]; tensor var_629_cast_fp16 = softmax(axis = var_539, x = aw_45_cast_fp16)[name = tensor("op_629_cast_fp16")]; tensor var_630_cast_fp16 = softmax(axis = var_539, x = aw_cast_fp16)[name = tensor("op_630_cast_fp16")]; tensor var_632_equation_0 = const()[name = tensor("op_632_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_632_cast_fp16 = einsum(equation = var_632_equation_0, values = (var_606_cast_fp16_0, var_625_cast_fp16))[name = tensor("op_632_cast_fp16")]; tensor var_634_equation_0 = const()[name = tensor("op_634_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_634_cast_fp16 = einsum(equation = var_634_equation_0, values = (var_606_cast_fp16_1, var_626_cast_fp16))[name = tensor("op_634_cast_fp16")]; tensor var_636_equation_0 = const()[name = tensor("op_636_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_636_cast_fp16 = einsum(equation = var_636_equation_0, values = (var_606_cast_fp16_2, var_627_cast_fp16))[name = tensor("op_636_cast_fp16")]; tensor var_638_equation_0 = const()[name = tensor("op_638_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_638_cast_fp16 = einsum(equation = var_638_equation_0, values = (var_606_cast_fp16_3, var_628_cast_fp16))[name = tensor("op_638_cast_fp16")]; tensor var_640_equation_0 = const()[name = tensor("op_640_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_640_cast_fp16 = einsum(equation = var_640_equation_0, values = (var_606_cast_fp16_4, var_629_cast_fp16))[name = tensor("op_640_cast_fp16")]; tensor var_642_equation_0 = const()[name = tensor("op_642_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_642_cast_fp16 = einsum(equation = var_642_equation_0, values = (var_606_cast_fp16_5, var_630_cast_fp16))[name = tensor("op_642_cast_fp16")]; tensor input_35_interleave_0 = const()[name = tensor("input_35_interleave_0"), val = tensor(false)]; tensor input_35_cast_fp16 = concat(axis = var_539, interleave = input_35_interleave_0, values = (var_632_cast_fp16, var_634_cast_fp16, var_636_cast_fp16, var_638_cast_fp16, var_640_cast_fp16, var_642_cast_fp16))[name = tensor("input_35_cast_fp16")]; tensor var_651_pad_type_0 = const()[name = tensor("op_651_pad_type_0"), val = tensor("valid")]; tensor var_651_strides_0 = const()[name = tensor("op_651_strides_0"), val = tensor([1, 1])]; tensor var_651_pad_0 = const()[name = tensor("op_651_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_651_dilations_0 = const()[name = tensor("op_651_dilations_0"), val = tensor([1, 1])]; tensor var_651_groups_0 = const()[name = tensor("op_651_groups_0"), val = tensor(1)]; tensor blocks_3_attn_out_weight_to_fp16 = const()[name = tensor("blocks_3_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13758592)))]; tensor blocks_3_attn_out_bias_to_fp16 = const()[name = tensor("blocks_3_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14053568)))]; tensor var_651_cast_fp16 = conv(bias = blocks_3_attn_out_bias_to_fp16, dilations = var_651_dilations_0, groups = var_651_groups_0, pad = var_651_pad_0, pad_type = var_651_pad_type_0, strides = var_651_strides_0, weight = blocks_3_attn_out_weight_to_fp16, x = input_35_cast_fp16)[name = tensor("op_651_cast_fp16")]; tensor inputs_15_cast_fp16 = add(x = inputs_13_cast_fp16, y = var_651_cast_fp16)[name = tensor("inputs_15_cast_fp16")]; tensor input_37_axes_0 = const()[name = tensor("input_37_axes_0"), val = tensor([1])]; tensor input_37_gamma_0_to_fp16 = const()[name = tensor("input_37_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14054400)))]; tensor input_37_beta_0_to_fp16 = const()[name = tensor("input_37_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14055232)))]; tensor var_661_to_fp16 = const()[name = tensor("op_661_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_37_cast_fp16 = layer_norm(axes = input_37_axes_0, beta = input_37_beta_0_to_fp16, epsilon = var_661_to_fp16, gamma = input_37_gamma_0_to_fp16, x = inputs_15_cast_fp16)[name = tensor("input_37_cast_fp16")]; tensor input_39_pad_type_0 = const()[name = tensor("input_39_pad_type_0"), val = tensor("valid")]; tensor input_39_strides_0 = const()[name = tensor("input_39_strides_0"), val = tensor([1, 1])]; tensor input_39_pad_0 = const()[name = tensor("input_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_39_dilations_0 = const()[name = tensor("input_39_dilations_0"), val = tensor([1, 1])]; tensor input_39_groups_0 = const()[name = tensor("input_39_groups_0"), val = tensor(1)]; tensor blocks_3_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14056064)))]; tensor blocks_3_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15235776)))]; tensor input_39_cast_fp16 = conv(bias = blocks_3_mlp_0_bias_to_fp16, dilations = input_39_dilations_0, groups = input_39_groups_0, pad = input_39_pad_0, pad_type = input_39_pad_type_0, strides = input_39_strides_0, weight = blocks_3_mlp_0_weight_to_fp16, x = input_37_cast_fp16)[name = tensor("input_39_cast_fp16")]; tensor input_mode_0 = const()[name = tensor("input_mode_0"), val = tensor("EXACT")]; tensor input_cast_fp16 = gelu(mode = input_mode_0, x = input_39_cast_fp16)[name = tensor("input_cast_fp16")]; tensor var_687_pad_type_0 = const()[name = tensor("op_687_pad_type_0"), val = tensor("valid")]; tensor var_687_strides_0 = const()[name = tensor("op_687_strides_0"), val = tensor([1, 1])]; tensor var_687_pad_0 = const()[name = tensor("op_687_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_687_dilations_0 = const()[name = tensor("op_687_dilations_0"), val = tensor([1, 1])]; tensor var_687_groups_0 = const()[name = tensor("op_687_groups_0"), val = tensor(1)]; tensor blocks_3_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15238912)))]; tensor blocks_3_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16418624)))]; tensor var_687_cast_fp16 = conv(bias = blocks_3_mlp_2_bias_to_fp16, dilations = var_687_dilations_0, groups = var_687_groups_0, pad = var_687_pad_0, pad_type = var_687_pad_type_0, strides = var_687_strides_0, weight = blocks_3_mlp_2_weight_to_fp16, x = input_cast_fp16)[name = tensor("op_687_cast_fp16")]; tensor inputs_cast_fp16 = add(x = inputs_15_cast_fp16, y = var_687_cast_fp16)[name = tensor("inputs_cast_fp16")]; tensor x_axes_0 = const()[name = tensor("x_axes_0"), val = tensor([1])]; tensor x_gamma_0_to_fp16 = const()[name = tensor("x_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16419456)))]; tensor x_beta_0_to_fp16 = const()[name = tensor("x_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16420288)))]; tensor var_701_to_fp16 = const()[name = tensor("op_701_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_cast_fp16 = layer_norm(axes = x_axes_0, beta = x_beta_0_to_fp16, epsilon = var_701_to_fp16, gamma = x_gamma_0_to_fp16, x = inputs_cast_fp16)[name = tensor("x_cast_fp16")]; tensor var_712_axes_0 = const()[name = tensor("op_712_axes_0"), val = tensor([2])]; tensor var_712_cast_fp16 = squeeze(axes = var_712_axes_0, x = x_cast_fp16)[name = tensor("op_712_cast_fp16")]; tensor var_715_perm_0 = const()[name = tensor("op_715_perm_0"), val = tensor([0, 2, 1])]; tensor var_715_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_715_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor var_715_cast_fp16 = transpose(perm = var_715_perm_0, x = var_712_cast_fp16)[name = tensor("transpose_0")]; tensor output = cast(dtype = var_715_cast_fp16_to_fp32_dtype_0, x = var_715_cast_fp16)[name = tensor("cast_19")]; } -> (output); }