program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "5.33.5"}, {"coremlc-version", "1877.40.3"}, {"coremltools-component-torch", "1.11.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "7.1"}})] { func main(tensor logmel_data) { tensor var_20 = const()[name = tensor("op_20"), val = tensor(1)]; tensor var_28 = const()[name = tensor("op_28"), val = tensor([1])]; tensor var_30 = const()[name = tensor("op_30"), val = tensor([1])]; tensor var_32_pad_type_0 = const()[name = tensor("op_32_pad_type_0"), val = tensor("custom")]; tensor var_32_pad_0 = const()[name = tensor("op_32_pad_0"), val = tensor([1, 1])]; tensor logmel_data_to_fp16_dtype_0 = const()[name = tensor("logmel_data_to_fp16_dtype_0"), val = tensor("fp16")]; tensor weight_3_to_fp16 = const()[name = tensor("weight_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor bias_3_to_fp16 = const()[name = tensor("bias_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245888)))]; tensor cast_37 = cast(dtype = logmel_data_to_fp16_dtype_0, x = logmel_data)[name = tensor("cast_37")]; tensor var_32_cast_fp16 = conv(bias = bias_3_to_fp16, dilations = var_30, groups = var_20, pad = var_32_pad_0, pad_type = var_32_pad_type_0, strides = var_28, weight = weight_3_to_fp16, x = cast_37)[name = tensor("op_32_cast_fp16")]; tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; tensor input_1_cast_fp16 = gelu(mode = input_1_mode_0, x = var_32_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor var_36 = const()[name = tensor("op_36"), val = tensor(1)]; tensor var_45 = const()[name = tensor("op_45"), val = tensor([2])]; tensor var_47 = const()[name = tensor("op_47"), val = tensor([1])]; tensor var_49_pad_type_0 = const()[name = tensor("op_49_pad_type_0"), val = tensor("custom")]; tensor var_49_pad_0 = const()[name = tensor("op_49_pad_0"), val = tensor([1, 1])]; tensor weight_7_to_fp16 = const()[name = tensor("weight_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246976)))]; tensor bias_7_to_fp16 = const()[name = tensor("bias_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1819904)))]; tensor var_49_cast_fp16 = conv(bias = bias_7_to_fp16, dilations = var_47, groups = var_36, pad = var_49_pad_0, pad_type = var_49_pad_type_0, strides = var_45, weight = weight_7_to_fp16, x = input_1_cast_fp16)[name = tensor("op_49_cast_fp16")]; tensor x_3_mode_0 = const()[name = tensor("x_3_mode_0"), val = tensor("EXACT")]; tensor x_3_cast_fp16 = gelu(mode = x_3_mode_0, x = var_49_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor var_54 = const()[name = tensor("op_54"), val = tensor([0, 2, 1])]; tensor positional_embedding_to_fp16 = const()[name = tensor("positional_embedding_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1820992)))]; tensor transpose_60 = transpose(perm = var_54, x = x_3_cast_fp16)[name = tensor("transpose_60")]; tensor var_57_cast_fp16 = add(x = transpose_60, y = positional_embedding_to_fp16)[name = tensor("op_57_cast_fp16")]; tensor var_70 = const()[name = tensor("op_70"), val = tensor(-1)]; tensor var_87_axes_0 = const()[name = tensor("op_87_axes_0"), val = tensor([-1])]; tensor blocks_0_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_0_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3357056)))]; tensor blocks_0_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_0_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3358144)))]; tensor var_76_to_fp16 = const()[name = tensor("op_76_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_87_cast_fp16 = layer_norm(axes = var_87_axes_0, beta = blocks_0_attn_ln_bias_to_fp16, epsilon = var_76_to_fp16, gamma = blocks_0_attn_ln_weight_to_fp16, x = var_57_cast_fp16)[name = tensor("op_87_cast_fp16")]; tensor var_98_to_fp16 = const()[name = tensor("op_98_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3359232)))]; tensor var_99_to_fp16 = const()[name = tensor("op_99_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3883584)))]; tensor linear_0_cast_fp16 = linear(bias = var_99_to_fp16, weight = var_98_to_fp16, x = var_87_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor var_102_to_fp16 = const()[name = tensor("op_102_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3884672)))]; tensor linear_1_bias_0_to_fp16 = const()[name = tensor("linear_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4409024)))]; tensor linear_1_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_102_to_fp16, x = var_87_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor var_106_to_fp16 = const()[name = tensor("op_106_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4410112)))]; tensor var_107_to_fp16 = const()[name = tensor("op_107_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4934464)))]; tensor linear_2_cast_fp16 = linear(bias = var_107_to_fp16, weight = var_106_to_fp16, x = var_87_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor var_115 = const()[name = tensor("op_115"), val = tensor([1, 1500, 8, -1])]; tensor var_116_cast_fp16 = reshape(shape = var_115, x = linear_0_cast_fp16)[name = tensor("op_116_cast_fp16")]; tensor const_42_to_fp16 = const()[name = tensor("const_42_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_3_cast_fp16 = mul(x = var_116_cast_fp16, y = const_42_to_fp16)[name = tensor("q_3_cast_fp16")]; tensor var_122 = const()[name = tensor("op_122"), val = tensor([1, 1500, 8, -1])]; tensor var_123_cast_fp16 = reshape(shape = var_122, x = linear_1_cast_fp16)[name = tensor("op_123_cast_fp16")]; tensor const_43_to_fp16 = const()[name = tensor("const_43_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_3_cast_fp16 = mul(x = var_123_cast_fp16, y = const_43_to_fp16)[name = tensor("k_3_cast_fp16")]; tensor var_129 = const()[name = tensor("op_129"), val = tensor([1, 1500, 8, -1])]; tensor var_130_cast_fp16 = reshape(shape = var_129, x = linear_2_cast_fp16)[name = tensor("op_130_cast_fp16")]; tensor var_131 = const()[name = tensor("op_131"), val = tensor([0, 2, 1, 3])]; tensor qk_1_transpose_x_0 = const()[name = tensor("qk_1_transpose_x_0"), val = tensor(false)]; tensor qk_1_transpose_y_0 = const()[name = tensor("qk_1_transpose_y_0"), val = tensor(false)]; tensor transpose_24_perm_0 = const()[name = tensor("transpose_24_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_25_perm_0 = const()[name = tensor("transpose_25_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_57 = transpose(perm = transpose_25_perm_0, x = k_3_cast_fp16)[name = tensor("transpose_57")]; tensor transpose_58 = transpose(perm = transpose_24_perm_0, x = q_3_cast_fp16)[name = tensor("transpose_58")]; tensor qk_1_cast_fp16 = matmul(transpose_x = qk_1_transpose_x_0, transpose_y = qk_1_transpose_y_0, x = transpose_58, y = transpose_57)[name = tensor("qk_1_cast_fp16")]; tensor var_135_cast_fp16 = softmax(axis = var_70, x = qk_1_cast_fp16)[name = tensor("op_135_cast_fp16")]; tensor var_137_transpose_x_0 = const()[name = tensor("op_137_transpose_x_0"), val = tensor(false)]; tensor var_137_transpose_y_0 = const()[name = tensor("op_137_transpose_y_0"), val = tensor(false)]; tensor transpose_59 = transpose(perm = var_131, x = var_130_cast_fp16)[name = tensor("transpose_59")]; tensor var_137_cast_fp16 = matmul(transpose_x = var_137_transpose_x_0, transpose_y = var_137_transpose_y_0, x = var_135_cast_fp16, y = transpose_59)[name = tensor("op_137_cast_fp16")]; tensor var_138 = const()[name = tensor("op_138"), val = tensor([0, 2, 1, 3])]; tensor concat_0 = const()[name = tensor("concat_0"), val = tensor([1, 1500, 512])]; tensor transpose_56 = transpose(perm = var_138, x = var_137_cast_fp16)[name = tensor("transpose_56")]; tensor x_11_cast_fp16 = reshape(shape = concat_0, x = transpose_56)[name = tensor("x_11_cast_fp16")]; tensor var_143_to_fp16 = const()[name = tensor("op_143_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4935552)))]; tensor var_144_to_fp16 = const()[name = tensor("op_144_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5459904)))]; tensor linear_3_cast_fp16 = linear(bias = var_144_to_fp16, weight = var_143_to_fp16, x = x_11_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor x_13_cast_fp16 = add(x = var_57_cast_fp16, y = linear_3_cast_fp16)[name = tensor("x_13_cast_fp16")]; tensor var_151_axes_0 = const()[name = tensor("op_151_axes_0"), val = tensor([-1])]; tensor blocks_0_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5460992)))]; tensor blocks_0_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5462080)))]; tensor var_151_cast_fp16 = layer_norm(axes = var_151_axes_0, beta = blocks_0_mlp_ln_bias_to_fp16, epsilon = var_76_to_fp16, gamma = blocks_0_mlp_ln_weight_to_fp16, x = x_13_cast_fp16)[name = tensor("op_151_cast_fp16")]; tensor var_160_to_fp16 = const()[name = tensor("op_160_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5463168)))]; tensor var_161_to_fp16 = const()[name = tensor("op_161_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7560384)))]; tensor linear_4_cast_fp16 = linear(bias = var_161_to_fp16, weight = var_160_to_fp16, x = var_151_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor x_17_mode_0 = const()[name = tensor("x_17_mode_0"), val = tensor("EXACT")]; tensor x_17_cast_fp16 = gelu(mode = x_17_mode_0, x = linear_4_cast_fp16)[name = tensor("x_17_cast_fp16")]; tensor var_166_to_fp16 = const()[name = tensor("op_166_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7564544)))]; tensor var_167_to_fp16 = const()[name = tensor("op_167_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9661760)))]; tensor linear_5_cast_fp16 = linear(bias = var_167_to_fp16, weight = var_166_to_fp16, x = x_17_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor x_19_cast_fp16 = add(x = x_13_cast_fp16, y = linear_5_cast_fp16)[name = tensor("x_19_cast_fp16")]; tensor var_177 = const()[name = tensor("op_177"), val = tensor(-1)]; tensor var_194_axes_0 = const()[name = tensor("op_194_axes_0"), val = tensor([-1])]; tensor blocks_1_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_1_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9662848)))]; tensor blocks_1_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_1_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9663936)))]; tensor var_183_to_fp16 = const()[name = tensor("op_183_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_194_cast_fp16 = layer_norm(axes = var_194_axes_0, beta = blocks_1_attn_ln_bias_to_fp16, epsilon = var_183_to_fp16, gamma = blocks_1_attn_ln_weight_to_fp16, x = x_19_cast_fp16)[name = tensor("op_194_cast_fp16")]; tensor var_205_to_fp16 = const()[name = tensor("op_205_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9665024)))]; tensor var_206_to_fp16 = const()[name = tensor("op_206_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10189376)))]; tensor linear_6_cast_fp16 = linear(bias = var_206_to_fp16, weight = var_205_to_fp16, x = var_194_cast_fp16)[name = tensor("linear_6_cast_fp16")]; tensor var_209_to_fp16 = const()[name = tensor("op_209_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10190464)))]; tensor linear_7_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_209_to_fp16, x = var_194_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor var_213_to_fp16 = const()[name = tensor("op_213_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10714816)))]; tensor var_214_to_fp16 = const()[name = tensor("op_214_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11239168)))]; tensor linear_8_cast_fp16 = linear(bias = var_214_to_fp16, weight = var_213_to_fp16, x = var_194_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor var_222 = const()[name = tensor("op_222"), val = tensor([1, 1500, 8, -1])]; tensor var_223_cast_fp16 = reshape(shape = var_222, x = linear_6_cast_fp16)[name = tensor("op_223_cast_fp16")]; tensor const_44_to_fp16 = const()[name = tensor("const_44_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_7_cast_fp16 = mul(x = var_223_cast_fp16, y = const_44_to_fp16)[name = tensor("q_7_cast_fp16")]; tensor var_229 = const()[name = tensor("op_229"), val = tensor([1, 1500, 8, -1])]; tensor var_230_cast_fp16 = reshape(shape = var_229, x = linear_7_cast_fp16)[name = tensor("op_230_cast_fp16")]; tensor const_45_to_fp16 = const()[name = tensor("const_45_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_7_cast_fp16 = mul(x = var_230_cast_fp16, y = const_45_to_fp16)[name = tensor("k_7_cast_fp16")]; tensor var_236 = const()[name = tensor("op_236"), val = tensor([1, 1500, 8, -1])]; tensor var_237_cast_fp16 = reshape(shape = var_236, x = linear_8_cast_fp16)[name = tensor("op_237_cast_fp16")]; tensor var_238 = const()[name = tensor("op_238"), val = tensor([0, 2, 1, 3])]; tensor qk_3_transpose_x_0 = const()[name = tensor("qk_3_transpose_x_0"), val = tensor(false)]; tensor qk_3_transpose_y_0 = const()[name = tensor("qk_3_transpose_y_0"), val = tensor(false)]; tensor transpose_26_perm_0 = const()[name = tensor("transpose_26_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_27_perm_0 = const()[name = tensor("transpose_27_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_53 = transpose(perm = transpose_27_perm_0, x = k_7_cast_fp16)[name = tensor("transpose_53")]; tensor transpose_54 = transpose(perm = transpose_26_perm_0, x = q_7_cast_fp16)[name = tensor("transpose_54")]; tensor qk_3_cast_fp16 = matmul(transpose_x = qk_3_transpose_x_0, transpose_y = qk_3_transpose_y_0, x = transpose_54, y = transpose_53)[name = tensor("qk_3_cast_fp16")]; tensor var_242_cast_fp16 = softmax(axis = var_177, x = qk_3_cast_fp16)[name = tensor("op_242_cast_fp16")]; tensor var_244_transpose_x_0 = const()[name = tensor("op_244_transpose_x_0"), val = tensor(false)]; tensor var_244_transpose_y_0 = const()[name = tensor("op_244_transpose_y_0"), val = tensor(false)]; tensor transpose_55 = transpose(perm = var_238, x = var_237_cast_fp16)[name = tensor("transpose_55")]; tensor var_244_cast_fp16 = matmul(transpose_x = var_244_transpose_x_0, transpose_y = var_244_transpose_y_0, x = var_242_cast_fp16, y = transpose_55)[name = tensor("op_244_cast_fp16")]; tensor var_245 = const()[name = tensor("op_245"), val = tensor([0, 2, 1, 3])]; tensor concat_1 = const()[name = tensor("concat_1"), val = tensor([1, 1500, 512])]; tensor transpose_52 = transpose(perm = var_245, x = var_244_cast_fp16)[name = tensor("transpose_52")]; tensor x_23_cast_fp16 = reshape(shape = concat_1, x = transpose_52)[name = tensor("x_23_cast_fp16")]; tensor var_250_to_fp16 = const()[name = tensor("op_250_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11240256)))]; tensor var_251_to_fp16 = const()[name = tensor("op_251_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11764608)))]; tensor linear_9_cast_fp16 = linear(bias = var_251_to_fp16, weight = var_250_to_fp16, x = x_23_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor x_25_cast_fp16 = add(x = x_19_cast_fp16, y = linear_9_cast_fp16)[name = tensor("x_25_cast_fp16")]; tensor var_258_axes_0 = const()[name = tensor("op_258_axes_0"), val = tensor([-1])]; tensor blocks_1_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11765696)))]; tensor blocks_1_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11766784)))]; tensor var_258_cast_fp16 = layer_norm(axes = var_258_axes_0, beta = blocks_1_mlp_ln_bias_to_fp16, epsilon = var_183_to_fp16, gamma = blocks_1_mlp_ln_weight_to_fp16, x = x_25_cast_fp16)[name = tensor("op_258_cast_fp16")]; tensor var_267_to_fp16 = const()[name = tensor("op_267_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11767872)))]; tensor var_268_to_fp16 = const()[name = tensor("op_268_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13865088)))]; tensor linear_10_cast_fp16 = linear(bias = var_268_to_fp16, weight = var_267_to_fp16, x = var_258_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor x_29_mode_0 = const()[name = tensor("x_29_mode_0"), val = tensor("EXACT")]; tensor x_29_cast_fp16 = gelu(mode = x_29_mode_0, x = linear_10_cast_fp16)[name = tensor("x_29_cast_fp16")]; tensor var_273_to_fp16 = const()[name = tensor("op_273_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13869248)))]; tensor var_274_to_fp16 = const()[name = tensor("op_274_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15966464)))]; tensor linear_11_cast_fp16 = linear(bias = var_274_to_fp16, weight = var_273_to_fp16, x = x_29_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor x_31_cast_fp16 = add(x = x_25_cast_fp16, y = linear_11_cast_fp16)[name = tensor("x_31_cast_fp16")]; tensor var_284 = const()[name = tensor("op_284"), val = tensor(-1)]; tensor var_301_axes_0 = const()[name = tensor("op_301_axes_0"), val = tensor([-1])]; tensor blocks_2_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_2_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15967552)))]; tensor blocks_2_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_2_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15968640)))]; tensor var_290_to_fp16 = const()[name = tensor("op_290_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_301_cast_fp16 = layer_norm(axes = var_301_axes_0, beta = blocks_2_attn_ln_bias_to_fp16, epsilon = var_290_to_fp16, gamma = blocks_2_attn_ln_weight_to_fp16, x = x_31_cast_fp16)[name = tensor("op_301_cast_fp16")]; tensor var_312_to_fp16 = const()[name = tensor("op_312_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15969728)))]; tensor var_313_to_fp16 = const()[name = tensor("op_313_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16494080)))]; tensor linear_12_cast_fp16 = linear(bias = var_313_to_fp16, weight = var_312_to_fp16, x = var_301_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor var_316_to_fp16 = const()[name = tensor("op_316_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16495168)))]; tensor linear_13_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_316_to_fp16, x = var_301_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor var_320_to_fp16 = const()[name = tensor("op_320_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17019520)))]; tensor var_321_to_fp16 = const()[name = tensor("op_321_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17543872)))]; tensor linear_14_cast_fp16 = linear(bias = var_321_to_fp16, weight = var_320_to_fp16, x = var_301_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor var_329 = const()[name = tensor("op_329"), val = tensor([1, 1500, 8, -1])]; tensor var_330_cast_fp16 = reshape(shape = var_329, x = linear_12_cast_fp16)[name = tensor("op_330_cast_fp16")]; tensor const_46_to_fp16 = const()[name = tensor("const_46_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_11_cast_fp16 = mul(x = var_330_cast_fp16, y = const_46_to_fp16)[name = tensor("q_11_cast_fp16")]; tensor var_336 = const()[name = tensor("op_336"), val = tensor([1, 1500, 8, -1])]; tensor var_337_cast_fp16 = reshape(shape = var_336, x = linear_13_cast_fp16)[name = tensor("op_337_cast_fp16")]; tensor const_47_to_fp16 = const()[name = tensor("const_47_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_11_cast_fp16 = mul(x = var_337_cast_fp16, y = const_47_to_fp16)[name = tensor("k_11_cast_fp16")]; tensor var_343 = const()[name = tensor("op_343"), val = tensor([1, 1500, 8, -1])]; tensor var_344_cast_fp16 = reshape(shape = var_343, x = linear_14_cast_fp16)[name = tensor("op_344_cast_fp16")]; tensor var_345 = const()[name = tensor("op_345"), val = tensor([0, 2, 1, 3])]; tensor qk_5_transpose_x_0 = const()[name = tensor("qk_5_transpose_x_0"), val = tensor(false)]; tensor qk_5_transpose_y_0 = const()[name = tensor("qk_5_transpose_y_0"), val = tensor(false)]; tensor transpose_28_perm_0 = const()[name = tensor("transpose_28_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_29_perm_0 = const()[name = tensor("transpose_29_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_49 = transpose(perm = transpose_29_perm_0, x = k_11_cast_fp16)[name = tensor("transpose_49")]; tensor transpose_50 = transpose(perm = transpose_28_perm_0, x = q_11_cast_fp16)[name = tensor("transpose_50")]; tensor qk_5_cast_fp16 = matmul(transpose_x = qk_5_transpose_x_0, transpose_y = qk_5_transpose_y_0, x = transpose_50, y = transpose_49)[name = tensor("qk_5_cast_fp16")]; tensor var_349_cast_fp16 = softmax(axis = var_284, x = qk_5_cast_fp16)[name = tensor("op_349_cast_fp16")]; tensor var_351_transpose_x_0 = const()[name = tensor("op_351_transpose_x_0"), val = tensor(false)]; tensor var_351_transpose_y_0 = const()[name = tensor("op_351_transpose_y_0"), val = tensor(false)]; tensor transpose_51 = transpose(perm = var_345, x = var_344_cast_fp16)[name = tensor("transpose_51")]; tensor var_351_cast_fp16 = matmul(transpose_x = var_351_transpose_x_0, transpose_y = var_351_transpose_y_0, x = var_349_cast_fp16, y = transpose_51)[name = tensor("op_351_cast_fp16")]; tensor var_352 = const()[name = tensor("op_352"), val = tensor([0, 2, 1, 3])]; tensor concat_2 = const()[name = tensor("concat_2"), val = tensor([1, 1500, 512])]; tensor transpose_48 = transpose(perm = var_352, x = var_351_cast_fp16)[name = tensor("transpose_48")]; tensor x_35_cast_fp16 = reshape(shape = concat_2, x = transpose_48)[name = tensor("x_35_cast_fp16")]; tensor var_357_to_fp16 = const()[name = tensor("op_357_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17544960)))]; tensor var_358_to_fp16 = const()[name = tensor("op_358_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18069312)))]; tensor linear_15_cast_fp16 = linear(bias = var_358_to_fp16, weight = var_357_to_fp16, x = x_35_cast_fp16)[name = tensor("linear_15_cast_fp16")]; tensor x_37_cast_fp16 = add(x = x_31_cast_fp16, y = linear_15_cast_fp16)[name = tensor("x_37_cast_fp16")]; tensor var_365_axes_0 = const()[name = tensor("op_365_axes_0"), val = tensor([-1])]; tensor blocks_2_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18070400)))]; tensor blocks_2_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18071488)))]; tensor var_365_cast_fp16 = layer_norm(axes = var_365_axes_0, beta = blocks_2_mlp_ln_bias_to_fp16, epsilon = var_290_to_fp16, gamma = blocks_2_mlp_ln_weight_to_fp16, x = x_37_cast_fp16)[name = tensor("op_365_cast_fp16")]; tensor var_374_to_fp16 = const()[name = tensor("op_374_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18072576)))]; tensor var_375_to_fp16 = const()[name = tensor("op_375_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20169792)))]; tensor linear_16_cast_fp16 = linear(bias = var_375_to_fp16, weight = var_374_to_fp16, x = var_365_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor x_41_mode_0 = const()[name = tensor("x_41_mode_0"), val = tensor("EXACT")]; tensor x_41_cast_fp16 = gelu(mode = x_41_mode_0, x = linear_16_cast_fp16)[name = tensor("x_41_cast_fp16")]; tensor var_380_to_fp16 = const()[name = tensor("op_380_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20173952)))]; tensor var_381_to_fp16 = const()[name = tensor("op_381_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22271168)))]; tensor linear_17_cast_fp16 = linear(bias = var_381_to_fp16, weight = var_380_to_fp16, x = x_41_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor x_43_cast_fp16 = add(x = x_37_cast_fp16, y = linear_17_cast_fp16)[name = tensor("x_43_cast_fp16")]; tensor var_391 = const()[name = tensor("op_391"), val = tensor(-1)]; tensor var_408_axes_0 = const()[name = tensor("op_408_axes_0"), val = tensor([-1])]; tensor blocks_3_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_3_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22272256)))]; tensor blocks_3_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_3_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22273344)))]; tensor var_397_to_fp16 = const()[name = tensor("op_397_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_408_cast_fp16 = layer_norm(axes = var_408_axes_0, beta = blocks_3_attn_ln_bias_to_fp16, epsilon = var_397_to_fp16, gamma = blocks_3_attn_ln_weight_to_fp16, x = x_43_cast_fp16)[name = tensor("op_408_cast_fp16")]; tensor var_419_to_fp16 = const()[name = tensor("op_419_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22274432)))]; tensor var_420_to_fp16 = const()[name = tensor("op_420_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22798784)))]; tensor linear_18_cast_fp16 = linear(bias = var_420_to_fp16, weight = var_419_to_fp16, x = var_408_cast_fp16)[name = tensor("linear_18_cast_fp16")]; tensor var_423_to_fp16 = const()[name = tensor("op_423_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22799872)))]; tensor linear_19_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_423_to_fp16, x = var_408_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor var_427_to_fp16 = const()[name = tensor("op_427_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23324224)))]; tensor var_428_to_fp16 = const()[name = tensor("op_428_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23848576)))]; tensor linear_20_cast_fp16 = linear(bias = var_428_to_fp16, weight = var_427_to_fp16, x = var_408_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor var_436 = const()[name = tensor("op_436"), val = tensor([1, 1500, 8, -1])]; tensor var_437_cast_fp16 = reshape(shape = var_436, x = linear_18_cast_fp16)[name = tensor("op_437_cast_fp16")]; tensor const_48_to_fp16 = const()[name = tensor("const_48_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_15_cast_fp16 = mul(x = var_437_cast_fp16, y = const_48_to_fp16)[name = tensor("q_15_cast_fp16")]; tensor var_443 = const()[name = tensor("op_443"), val = tensor([1, 1500, 8, -1])]; tensor var_444_cast_fp16 = reshape(shape = var_443, x = linear_19_cast_fp16)[name = tensor("op_444_cast_fp16")]; tensor const_49_to_fp16 = const()[name = tensor("const_49_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_15_cast_fp16 = mul(x = var_444_cast_fp16, y = const_49_to_fp16)[name = tensor("k_15_cast_fp16")]; tensor var_450 = const()[name = tensor("op_450"), val = tensor([1, 1500, 8, -1])]; tensor var_451_cast_fp16 = reshape(shape = var_450, x = linear_20_cast_fp16)[name = tensor("op_451_cast_fp16")]; tensor var_452 = const()[name = tensor("op_452"), val = tensor([0, 2, 1, 3])]; tensor qk_7_transpose_x_0 = const()[name = tensor("qk_7_transpose_x_0"), val = tensor(false)]; tensor qk_7_transpose_y_0 = const()[name = tensor("qk_7_transpose_y_0"), val = tensor(false)]; tensor transpose_30_perm_0 = const()[name = tensor("transpose_30_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_31_perm_0 = const()[name = tensor("transpose_31_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_45 = transpose(perm = transpose_31_perm_0, x = k_15_cast_fp16)[name = tensor("transpose_45")]; tensor transpose_46 = transpose(perm = transpose_30_perm_0, x = q_15_cast_fp16)[name = tensor("transpose_46")]; tensor qk_7_cast_fp16 = matmul(transpose_x = qk_7_transpose_x_0, transpose_y = qk_7_transpose_y_0, x = transpose_46, y = transpose_45)[name = tensor("qk_7_cast_fp16")]; tensor var_456_cast_fp16 = softmax(axis = var_391, x = qk_7_cast_fp16)[name = tensor("op_456_cast_fp16")]; tensor var_458_transpose_x_0 = const()[name = tensor("op_458_transpose_x_0"), val = tensor(false)]; tensor var_458_transpose_y_0 = const()[name = tensor("op_458_transpose_y_0"), val = tensor(false)]; tensor transpose_47 = transpose(perm = var_452, x = var_451_cast_fp16)[name = tensor("transpose_47")]; tensor var_458_cast_fp16 = matmul(transpose_x = var_458_transpose_x_0, transpose_y = var_458_transpose_y_0, x = var_456_cast_fp16, y = transpose_47)[name = tensor("op_458_cast_fp16")]; tensor var_459 = const()[name = tensor("op_459"), val = tensor([0, 2, 1, 3])]; tensor concat_3 = const()[name = tensor("concat_3"), val = tensor([1, 1500, 512])]; tensor transpose_44 = transpose(perm = var_459, x = var_458_cast_fp16)[name = tensor("transpose_44")]; tensor x_47_cast_fp16 = reshape(shape = concat_3, x = transpose_44)[name = tensor("x_47_cast_fp16")]; tensor var_464_to_fp16 = const()[name = tensor("op_464_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23849664)))]; tensor var_465_to_fp16 = const()[name = tensor("op_465_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24374016)))]; tensor linear_21_cast_fp16 = linear(bias = var_465_to_fp16, weight = var_464_to_fp16, x = x_47_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor x_49_cast_fp16 = add(x = x_43_cast_fp16, y = linear_21_cast_fp16)[name = tensor("x_49_cast_fp16")]; tensor var_472_axes_0 = const()[name = tensor("op_472_axes_0"), val = tensor([-1])]; tensor blocks_3_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24375104)))]; tensor blocks_3_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24376192)))]; tensor var_472_cast_fp16 = layer_norm(axes = var_472_axes_0, beta = blocks_3_mlp_ln_bias_to_fp16, epsilon = var_397_to_fp16, gamma = blocks_3_mlp_ln_weight_to_fp16, x = x_49_cast_fp16)[name = tensor("op_472_cast_fp16")]; tensor var_481_to_fp16 = const()[name = tensor("op_481_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24377280)))]; tensor var_482_to_fp16 = const()[name = tensor("op_482_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26474496)))]; tensor linear_22_cast_fp16 = linear(bias = var_482_to_fp16, weight = var_481_to_fp16, x = var_472_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor x_53_mode_0 = const()[name = tensor("x_53_mode_0"), val = tensor("EXACT")]; tensor x_53_cast_fp16 = gelu(mode = x_53_mode_0, x = linear_22_cast_fp16)[name = tensor("x_53_cast_fp16")]; tensor var_487_to_fp16 = const()[name = tensor("op_487_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26478656)))]; tensor var_488_to_fp16 = const()[name = tensor("op_488_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28575872)))]; tensor linear_23_cast_fp16 = linear(bias = var_488_to_fp16, weight = var_487_to_fp16, x = x_53_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor x_55_cast_fp16 = add(x = x_49_cast_fp16, y = linear_23_cast_fp16)[name = tensor("x_55_cast_fp16")]; tensor var_498 = const()[name = tensor("op_498"), val = tensor(-1)]; tensor var_515_axes_0 = const()[name = tensor("op_515_axes_0"), val = tensor([-1])]; tensor blocks_4_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_4_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28576960)))]; tensor blocks_4_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_4_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28578048)))]; tensor var_504_to_fp16 = const()[name = tensor("op_504_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_515_cast_fp16 = layer_norm(axes = var_515_axes_0, beta = blocks_4_attn_ln_bias_to_fp16, epsilon = var_504_to_fp16, gamma = blocks_4_attn_ln_weight_to_fp16, x = x_55_cast_fp16)[name = tensor("op_515_cast_fp16")]; tensor var_526_to_fp16 = const()[name = tensor("op_526_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28579136)))]; tensor var_527_to_fp16 = const()[name = tensor("op_527_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29103488)))]; tensor linear_24_cast_fp16 = linear(bias = var_527_to_fp16, weight = var_526_to_fp16, x = var_515_cast_fp16)[name = tensor("linear_24_cast_fp16")]; tensor var_530_to_fp16 = const()[name = tensor("op_530_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29104576)))]; tensor linear_25_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_530_to_fp16, x = var_515_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor var_534_to_fp16 = const()[name = tensor("op_534_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29628928)))]; tensor var_535_to_fp16 = const()[name = tensor("op_535_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30153280)))]; tensor linear_26_cast_fp16 = linear(bias = var_535_to_fp16, weight = var_534_to_fp16, x = var_515_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor var_543 = const()[name = tensor("op_543"), val = tensor([1, 1500, 8, -1])]; tensor var_544_cast_fp16 = reshape(shape = var_543, x = linear_24_cast_fp16)[name = tensor("op_544_cast_fp16")]; tensor const_50_to_fp16 = const()[name = tensor("const_50_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_19_cast_fp16 = mul(x = var_544_cast_fp16, y = const_50_to_fp16)[name = tensor("q_19_cast_fp16")]; tensor var_550 = const()[name = tensor("op_550"), val = tensor([1, 1500, 8, -1])]; tensor var_551_cast_fp16 = reshape(shape = var_550, x = linear_25_cast_fp16)[name = tensor("op_551_cast_fp16")]; tensor const_51_to_fp16 = const()[name = tensor("const_51_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_19_cast_fp16 = mul(x = var_551_cast_fp16, y = const_51_to_fp16)[name = tensor("k_19_cast_fp16")]; tensor var_557 = const()[name = tensor("op_557"), val = tensor([1, 1500, 8, -1])]; tensor var_558_cast_fp16 = reshape(shape = var_557, x = linear_26_cast_fp16)[name = tensor("op_558_cast_fp16")]; tensor var_559 = const()[name = tensor("op_559"), val = tensor([0, 2, 1, 3])]; tensor qk_9_transpose_x_0 = const()[name = tensor("qk_9_transpose_x_0"), val = tensor(false)]; tensor qk_9_transpose_y_0 = const()[name = tensor("qk_9_transpose_y_0"), val = tensor(false)]; tensor transpose_32_perm_0 = const()[name = tensor("transpose_32_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_33_perm_0 = const()[name = tensor("transpose_33_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_41 = transpose(perm = transpose_33_perm_0, x = k_19_cast_fp16)[name = tensor("transpose_41")]; tensor transpose_42 = transpose(perm = transpose_32_perm_0, x = q_19_cast_fp16)[name = tensor("transpose_42")]; tensor qk_9_cast_fp16 = matmul(transpose_x = qk_9_transpose_x_0, transpose_y = qk_9_transpose_y_0, x = transpose_42, y = transpose_41)[name = tensor("qk_9_cast_fp16")]; tensor var_563_cast_fp16 = softmax(axis = var_498, x = qk_9_cast_fp16)[name = tensor("op_563_cast_fp16")]; tensor var_565_transpose_x_0 = const()[name = tensor("op_565_transpose_x_0"), val = tensor(false)]; tensor var_565_transpose_y_0 = const()[name = tensor("op_565_transpose_y_0"), val = tensor(false)]; tensor transpose_43 = transpose(perm = var_559, x = var_558_cast_fp16)[name = tensor("transpose_43")]; tensor var_565_cast_fp16 = matmul(transpose_x = var_565_transpose_x_0, transpose_y = var_565_transpose_y_0, x = var_563_cast_fp16, y = transpose_43)[name = tensor("op_565_cast_fp16")]; tensor var_566 = const()[name = tensor("op_566"), val = tensor([0, 2, 1, 3])]; tensor concat_4 = const()[name = tensor("concat_4"), val = tensor([1, 1500, 512])]; tensor transpose_40 = transpose(perm = var_566, x = var_565_cast_fp16)[name = tensor("transpose_40")]; tensor x_59_cast_fp16 = reshape(shape = concat_4, x = transpose_40)[name = tensor("x_59_cast_fp16")]; tensor var_571_to_fp16 = const()[name = tensor("op_571_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30154368)))]; tensor var_572_to_fp16 = const()[name = tensor("op_572_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30678720)))]; tensor linear_27_cast_fp16 = linear(bias = var_572_to_fp16, weight = var_571_to_fp16, x = x_59_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor x_61_cast_fp16 = add(x = x_55_cast_fp16, y = linear_27_cast_fp16)[name = tensor("x_61_cast_fp16")]; tensor var_579_axes_0 = const()[name = tensor("op_579_axes_0"), val = tensor([-1])]; tensor blocks_4_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30679808)))]; tensor blocks_4_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30680896)))]; tensor var_579_cast_fp16 = layer_norm(axes = var_579_axes_0, beta = blocks_4_mlp_ln_bias_to_fp16, epsilon = var_504_to_fp16, gamma = blocks_4_mlp_ln_weight_to_fp16, x = x_61_cast_fp16)[name = tensor("op_579_cast_fp16")]; tensor var_588_to_fp16 = const()[name = tensor("op_588_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30681984)))]; tensor var_589_to_fp16 = const()[name = tensor("op_589_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32779200)))]; tensor linear_28_cast_fp16 = linear(bias = var_589_to_fp16, weight = var_588_to_fp16, x = var_579_cast_fp16)[name = tensor("linear_28_cast_fp16")]; tensor x_65_mode_0 = const()[name = tensor("x_65_mode_0"), val = tensor("EXACT")]; tensor x_65_cast_fp16 = gelu(mode = x_65_mode_0, x = linear_28_cast_fp16)[name = tensor("x_65_cast_fp16")]; tensor var_594_to_fp16 = const()[name = tensor("op_594_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32783360)))]; tensor var_595_to_fp16 = const()[name = tensor("op_595_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34880576)))]; tensor linear_29_cast_fp16 = linear(bias = var_595_to_fp16, weight = var_594_to_fp16, x = x_65_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor x_67_cast_fp16 = add(x = x_61_cast_fp16, y = linear_29_cast_fp16)[name = tensor("x_67_cast_fp16")]; tensor var_605 = const()[name = tensor("op_605"), val = tensor(-1)]; tensor var_622_axes_0 = const()[name = tensor("op_622_axes_0"), val = tensor([-1])]; tensor blocks_5_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_5_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34881664)))]; tensor blocks_5_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_5_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34882752)))]; tensor var_611_to_fp16 = const()[name = tensor("op_611_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_622_cast_fp16 = layer_norm(axes = var_622_axes_0, beta = blocks_5_attn_ln_bias_to_fp16, epsilon = var_611_to_fp16, gamma = blocks_5_attn_ln_weight_to_fp16, x = x_67_cast_fp16)[name = tensor("op_622_cast_fp16")]; tensor var_633_to_fp16 = const()[name = tensor("op_633_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34883840)))]; tensor var_634_to_fp16 = const()[name = tensor("op_634_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35408192)))]; tensor linear_30_cast_fp16 = linear(bias = var_634_to_fp16, weight = var_633_to_fp16, x = var_622_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor var_637_to_fp16 = const()[name = tensor("op_637_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35409280)))]; tensor linear_31_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_637_to_fp16, x = var_622_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor var_641_to_fp16 = const()[name = tensor("op_641_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35933632)))]; tensor var_642_to_fp16 = const()[name = tensor("op_642_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36457984)))]; tensor linear_32_cast_fp16 = linear(bias = var_642_to_fp16, weight = var_641_to_fp16, x = var_622_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor var_650 = const()[name = tensor("op_650"), val = tensor([1, 1500, 8, -1])]; tensor var_651_cast_fp16 = reshape(shape = var_650, x = linear_30_cast_fp16)[name = tensor("op_651_cast_fp16")]; tensor const_52_to_fp16 = const()[name = tensor("const_52_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_cast_fp16 = mul(x = var_651_cast_fp16, y = const_52_to_fp16)[name = tensor("q_cast_fp16")]; tensor var_657 = const()[name = tensor("op_657"), val = tensor([1, 1500, 8, -1])]; tensor var_658_cast_fp16 = reshape(shape = var_657, x = linear_31_cast_fp16)[name = tensor("op_658_cast_fp16")]; tensor const_53_to_fp16 = const()[name = tensor("const_53_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_cast_fp16 = mul(x = var_658_cast_fp16, y = const_53_to_fp16)[name = tensor("k_cast_fp16")]; tensor var_664 = const()[name = tensor("op_664"), val = tensor([1, 1500, 8, -1])]; tensor var_665_cast_fp16 = reshape(shape = var_664, x = linear_32_cast_fp16)[name = tensor("op_665_cast_fp16")]; tensor var_666 = const()[name = tensor("op_666"), val = tensor([0, 2, 1, 3])]; tensor qk_transpose_x_0 = const()[name = tensor("qk_transpose_x_0"), val = tensor(false)]; tensor qk_transpose_y_0 = const()[name = tensor("qk_transpose_y_0"), val = tensor(false)]; tensor transpose_34_perm_0 = const()[name = tensor("transpose_34_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_35_perm_0 = const()[name = tensor("transpose_35_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_37 = transpose(perm = transpose_35_perm_0, x = k_cast_fp16)[name = tensor("transpose_37")]; tensor transpose_38 = transpose(perm = transpose_34_perm_0, x = q_cast_fp16)[name = tensor("transpose_38")]; tensor qk_cast_fp16 = matmul(transpose_x = qk_transpose_x_0, transpose_y = qk_transpose_y_0, x = transpose_38, y = transpose_37)[name = tensor("qk_cast_fp16")]; tensor var_670_cast_fp16 = softmax(axis = var_605, x = qk_cast_fp16)[name = tensor("op_670_cast_fp16")]; tensor var_672_transpose_x_0 = const()[name = tensor("op_672_transpose_x_0"), val = tensor(false)]; tensor var_672_transpose_y_0 = const()[name = tensor("op_672_transpose_y_0"), val = tensor(false)]; tensor transpose_39 = transpose(perm = var_666, x = var_665_cast_fp16)[name = tensor("transpose_39")]; tensor var_672_cast_fp16 = matmul(transpose_x = var_672_transpose_x_0, transpose_y = var_672_transpose_y_0, x = var_670_cast_fp16, y = transpose_39)[name = tensor("op_672_cast_fp16")]; tensor var_673 = const()[name = tensor("op_673"), val = tensor([0, 2, 1, 3])]; tensor concat_5 = const()[name = tensor("concat_5"), val = tensor([1, 1500, 512])]; tensor transpose_36 = transpose(perm = var_673, x = var_672_cast_fp16)[name = tensor("transpose_36")]; tensor x_71_cast_fp16 = reshape(shape = concat_5, x = transpose_36)[name = tensor("x_71_cast_fp16")]; tensor var_678_to_fp16 = const()[name = tensor("op_678_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36459072)))]; tensor var_679_to_fp16 = const()[name = tensor("op_679_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36983424)))]; tensor linear_33_cast_fp16 = linear(bias = var_679_to_fp16, weight = var_678_to_fp16, x = x_71_cast_fp16)[name = tensor("linear_33_cast_fp16")]; tensor x_73_cast_fp16 = add(x = x_67_cast_fp16, y = linear_33_cast_fp16)[name = tensor("x_73_cast_fp16")]; tensor var_686_axes_0 = const()[name = tensor("op_686_axes_0"), val = tensor([-1])]; tensor blocks_5_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36984512)))]; tensor blocks_5_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36985600)))]; tensor var_686_cast_fp16 = layer_norm(axes = var_686_axes_0, beta = blocks_5_mlp_ln_bias_to_fp16, epsilon = var_611_to_fp16, gamma = blocks_5_mlp_ln_weight_to_fp16, x = x_73_cast_fp16)[name = tensor("op_686_cast_fp16")]; tensor var_695_to_fp16 = const()[name = tensor("op_695_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36986688)))]; tensor var_696_to_fp16 = const()[name = tensor("op_696_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39083904)))]; tensor linear_34_cast_fp16 = linear(bias = var_696_to_fp16, weight = var_695_to_fp16, x = var_686_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor x_77_mode_0 = const()[name = tensor("x_77_mode_0"), val = tensor("EXACT")]; tensor x_77_cast_fp16 = gelu(mode = x_77_mode_0, x = linear_34_cast_fp16)[name = tensor("x_77_cast_fp16")]; tensor var_701_to_fp16 = const()[name = tensor("op_701_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39088064)))]; tensor var_702_to_fp16 = const()[name = tensor("op_702_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41185280)))]; tensor linear_35_cast_fp16 = linear(bias = var_702_to_fp16, weight = var_701_to_fp16, x = x_77_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor x_cast_fp16 = add(x = x_73_cast_fp16, y = linear_35_cast_fp16)[name = tensor("x_cast_fp16")]; tensor var_716_axes_0 = const()[name = tensor("op_716_axes_0"), val = tensor([-1])]; tensor ln_post_weight_to_fp16 = const()[name = tensor("ln_post_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41186368)))]; tensor ln_post_bias_to_fp16 = const()[name = tensor("ln_post_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41187456)))]; tensor var_707_to_fp16 = const()[name = tensor("op_707_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_716_cast_fp16 = layer_norm(axes = var_716_axes_0, beta = ln_post_bias_to_fp16, epsilon = var_707_to_fp16, gamma = ln_post_weight_to_fp16, x = x_cast_fp16)[name = tensor("op_716_cast_fp16")]; tensor var_716_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_716_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor output = cast(dtype = var_716_cast_fp16_to_fp32_dtype_0, x = var_716_cast_fp16)[name = tensor("cast_36")]; } -> (output); }