program(1.3) [buildInfo = dict({{"coremlc-component-MIL", "3400.43.1"}, {"coremlc-version", "3400.58.2"}})] { func main(tensor logmel_data) { string var_84_pad_type_0 = const()[name = string("op_84_pad_type_0"), val = string("custom")]; tensor var_84_pad_0 = const()[name = string("op_84_pad_0"), val = tensor([1, 1])]; tensor var_84_strides_0 = const()[name = string("op_84_strides_0"), val = tensor([1])]; tensor var_84_dilations_0 = const()[name = string("op_84_dilations_0"), val = tensor([1])]; int32 var_84_groups_0 = const()[name = string("op_84_groups_0"), val = int32(1)]; tensor weight_3_to_fp16 = const()[name = string("weight_3_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(64)))]; tensor bias_3_to_fp16 = const()[name = string("bias_3_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(614528)))]; tensor var_84_cast_fp16 = conv(bias = bias_3_to_fp16, dilations = var_84_dilations_0, groups = var_84_groups_0, pad = var_84_pad_0, pad_type = var_84_pad_type_0, strides = var_84_strides_0, weight = weight_3_to_fp16, x = logmel_data)[name = string("op_84_cast_fp16")]; string input_1_mode_0 = const()[name = string("input_1_mode_0"), val = string("EXACT")]; tensor input_1_cast_fp16 = gelu(mode = input_1_mode_0, x = var_84_cast_fp16)[name = string("input_1_cast_fp16")]; string var_102_pad_type_0 = const()[name = string("op_102_pad_type_0"), val = string("custom")]; tensor var_102_pad_0 = const()[name = string("op_102_pad_0"), val = tensor([1, 1])]; tensor var_102_strides_0 = const()[name = string("op_102_strides_0"), val = tensor([2])]; tensor var_102_dilations_0 = const()[name = string("op_102_dilations_0"), val = tensor([1])]; int32 var_102_groups_0 = const()[name = string("op_102_groups_0"), val = int32(1)]; tensor weight_7_to_fp16 = const()[name = string("weight_7_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(617152)))]; tensor bias_7_to_fp16 = const()[name = string("bias_7_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(10447616)))]; tensor var_102_cast_fp16 = conv(bias = bias_7_to_fp16, dilations = var_102_dilations_0, groups = var_102_groups_0, pad = var_102_pad_0, pad_type = var_102_pad_type_0, strides = var_102_strides_0, weight = weight_7_to_fp16, x = input_1_cast_fp16)[name = string("op_102_cast_fp16")]; string x_3_mode_0 = const()[name = string("x_3_mode_0"), val = string("EXACT")]; tensor x_3_cast_fp16 = gelu(mode = x_3_mode_0, x = var_102_cast_fp16)[name = string("x_3_cast_fp16")]; tensor var_108 = const()[name = string("op_108"), val = tensor([0, 2, 1])]; tensor positional_embedding_to_fp16 = const()[name = string("positional_embedding_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(10450240)))]; tensor x_5_cast_fp16 = transpose(perm = var_108, x = x_3_cast_fp16)[name = string("transpose_160")]; tensor var_111_cast_fp16 = add(x = x_5_cast_fp16, y = positional_embedding_to_fp16)[name = string("op_111_cast_fp16")]; int32 var_124 = const()[name = string("op_124"), val = int32(-1)]; tensor var_140_axes_0 = const()[name = string("op_140_axes_0"), val = tensor([-1])]; tensor blocks_0_attn_ln_weight_to_fp16 = const()[name = string("blocks_0_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(14290304)))]; tensor blocks_0_attn_ln_bias_to_fp16 = const()[name = string("blocks_0_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(14292928)))]; fp16 var_130_to_fp16 = const()[name = string("op_130_to_fp16"), val = fp16(0x1.5p-17)]; tensor var_140_cast_fp16 = layer_norm(axes = var_140_axes_0, beta = blocks_0_attn_ln_bias_to_fp16, epsilon = var_130_to_fp16, gamma = blocks_0_attn_ln_weight_to_fp16, x = var_111_cast_fp16)[name = string("op_140_cast_fp16")]; tensor var_151_to_fp16 = const()[name = string("op_151_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(14295552)))]; tensor var_152_to_fp16 = const()[name = string("op_152_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(17572416)))]; tensor linear_0_cast_fp16 = linear(bias = var_152_to_fp16, weight = var_151_to_fp16, x = var_140_cast_fp16)[name = string("linear_0_cast_fp16")]; tensor var_155_to_fp16 = const()[name = string("op_155_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(17575040)))]; tensor linear_1_bias_0_to_fp16 = const()[name = string("linear_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(20851904)))]; tensor linear_1_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_155_to_fp16, x = var_140_cast_fp16)[name = string("linear_1_cast_fp16")]; tensor var_159_to_fp16 = const()[name = string("op_159_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(20854528)))]; tensor var_160_to_fp16 = const()[name = string("op_160_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(24131392)))]; tensor linear_2_cast_fp16 = linear(bias = var_160_to_fp16, weight = var_159_to_fp16, x = var_140_cast_fp16)[name = string("linear_2_cast_fp16")]; tensor var_168 = const()[name = string("op_168"), val = tensor([1, 1500, 20, -1])]; tensor var_169_cast_fp16 = reshape(shape = var_168, x = linear_0_cast_fp16)[name = string("op_169_cast_fp16")]; tensor const_224_to_fp16 = const()[name = string("const_224_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_3_cast_fp16 = mul(x = var_169_cast_fp16, y = const_224_to_fp16)[name = string("q_3_cast_fp16")]; tensor var_175 = const()[name = string("op_175"), val = tensor([1, 1500, 20, -1])]; tensor var_176_cast_fp16 = reshape(shape = var_175, x = linear_1_cast_fp16)[name = string("op_176_cast_fp16")]; tensor const_225_to_fp16 = const()[name = string("const_225_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_3_cast_fp16 = mul(x = var_176_cast_fp16, y = const_225_to_fp16)[name = string("k_3_cast_fp16")]; tensor var_182 = const()[name = string("op_182"), val = tensor([1, 1500, 20, -1])]; tensor var_183_cast_fp16 = reshape(shape = var_182, x = linear_2_cast_fp16)[name = string("op_183_cast_fp16")]; tensor var_184 = const()[name = string("op_184"), val = tensor([0, 2, -3, -1])]; bool qk_1_transpose_x_0 = const()[name = string("qk_1_transpose_x_0"), val = bool(false)]; bool qk_1_transpose_y_0 = const()[name = string("qk_1_transpose_y_0"), val = bool(false)]; tensor transpose_64_perm_0 = const()[name = string("transpose_64_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_65_perm_0 = const()[name = string("transpose_65_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_65 = transpose(perm = transpose_65_perm_0, x = k_3_cast_fp16)[name = string("transpose_158")]; tensor transpose_64 = transpose(perm = transpose_64_perm_0, x = q_3_cast_fp16)[name = string("transpose_159")]; tensor qk_1_cast_fp16 = matmul(transpose_x = qk_1_transpose_x_0, transpose_y = qk_1_transpose_y_0, x = transpose_64, y = transpose_65)[name = string("qk_1_cast_fp16")]; tensor var_188_cast_fp16 = softmax(axis = var_124, x = qk_1_cast_fp16)[name = string("op_188_cast_fp16")]; bool var_190_transpose_x_0 = const()[name = string("op_190_transpose_x_0"), val = bool(false)]; bool var_190_transpose_y_0 = const()[name = string("op_190_transpose_y_0"), val = bool(false)]; tensor v_3_cast_fp16 = transpose(perm = var_184, x = var_183_cast_fp16)[name = string("transpose_157")]; tensor var_190_cast_fp16 = matmul(transpose_x = var_190_transpose_x_0, transpose_y = var_190_transpose_y_0, x = var_188_cast_fp16, y = v_3_cast_fp16)[name = string("op_190_cast_fp16")]; tensor var_191 = const()[name = string("op_191"), val = tensor([0, 2, 1, 3])]; tensor concat_0 = const()[name = string("concat_0"), val = tensor([1, 1500, 1280])]; tensor var_192_cast_fp16 = transpose(perm = var_191, x = var_190_cast_fp16)[name = string("transpose_156")]; tensor x_11_cast_fp16 = reshape(shape = concat_0, x = var_192_cast_fp16)[name = string("x_11_cast_fp16")]; tensor var_196_to_fp16 = const()[name = string("op_196_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(24134016)))]; tensor var_197_to_fp16 = const()[name = string("op_197_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(27410880)))]; tensor linear_3_cast_fp16 = linear(bias = var_197_to_fp16, weight = var_196_to_fp16, x = x_11_cast_fp16)[name = string("linear_3_cast_fp16")]; tensor x_13_cast_fp16 = add(x = var_111_cast_fp16, y = linear_3_cast_fp16)[name = string("x_13_cast_fp16")]; tensor var_204_axes_0 = const()[name = string("op_204_axes_0"), val = tensor([-1])]; tensor blocks_0_mlp_ln_weight_to_fp16 = const()[name = string("blocks_0_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(27413504)))]; tensor blocks_0_mlp_ln_bias_to_fp16 = const()[name = string("blocks_0_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(27416128)))]; tensor var_204_cast_fp16 = layer_norm(axes = var_204_axes_0, beta = blocks_0_mlp_ln_bias_to_fp16, epsilon = var_130_to_fp16, gamma = blocks_0_mlp_ln_weight_to_fp16, x = x_13_cast_fp16)[name = string("op_204_cast_fp16")]; tensor var_213_to_fp16 = const()[name = string("op_213_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(27418752)))]; tensor var_214_to_fp16 = const()[name = string("op_214_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(40526016)))]; tensor linear_4_cast_fp16 = linear(bias = var_214_to_fp16, weight = var_213_to_fp16, x = var_204_cast_fp16)[name = string("linear_4_cast_fp16")]; string x_17_mode_0 = const()[name = string("x_17_mode_0"), val = string("EXACT")]; tensor x_17_cast_fp16 = gelu(mode = x_17_mode_0, x = linear_4_cast_fp16)[name = string("x_17_cast_fp16")]; tensor var_219_to_fp16 = const()[name = string("op_219_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(40536320)))]; tensor var_220_to_fp16 = const()[name = string("op_220_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(53643584)))]; tensor linear_5_cast_fp16 = linear(bias = var_220_to_fp16, weight = var_219_to_fp16, x = x_17_cast_fp16)[name = string("linear_5_cast_fp16")]; tensor x_19_cast_fp16 = add(x = x_13_cast_fp16, y = linear_5_cast_fp16)[name = string("x_19_cast_fp16")]; int32 var_230 = const()[name = string("op_230"), val = int32(-1)]; tensor var_246_axes_0 = const()[name = string("op_246_axes_0"), val = tensor([-1])]; tensor blocks_1_attn_ln_weight_to_fp16 = const()[name = string("blocks_1_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(53646208)))]; tensor blocks_1_attn_ln_bias_to_fp16 = const()[name = string("blocks_1_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(53648832)))]; fp16 var_236_to_fp16 = const()[name = string("op_236_to_fp16"), val = fp16(0x1.5p-17)]; tensor var_246_cast_fp16 = layer_norm(axes = var_246_axes_0, beta = blocks_1_attn_ln_bias_to_fp16, epsilon = var_236_to_fp16, gamma = blocks_1_attn_ln_weight_to_fp16, x = x_19_cast_fp16)[name = string("op_246_cast_fp16")]; tensor var_257_to_fp16 = const()[name = string("op_257_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(53651456)))]; tensor var_258_to_fp16 = const()[name = string("op_258_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(56928320)))]; tensor linear_6_cast_fp16 = linear(bias = var_258_to_fp16, weight = var_257_to_fp16, x = var_246_cast_fp16)[name = string("linear_6_cast_fp16")]; tensor var_261_to_fp16 = const()[name = string("op_261_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(56930944)))]; tensor linear_7_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_261_to_fp16, x = var_246_cast_fp16)[name = string("linear_7_cast_fp16")]; tensor var_265_to_fp16 = const()[name = string("op_265_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(60207808)))]; tensor var_266_to_fp16 = const()[name = string("op_266_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(63484672)))]; tensor linear_8_cast_fp16 = linear(bias = var_266_to_fp16, weight = var_265_to_fp16, x = var_246_cast_fp16)[name = string("linear_8_cast_fp16")]; tensor var_274 = const()[name = string("op_274"), val = tensor([1, 1500, 20, -1])]; tensor var_275_cast_fp16 = reshape(shape = var_274, x = linear_6_cast_fp16)[name = string("op_275_cast_fp16")]; tensor const_226_to_fp16 = const()[name = string("const_226_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_7_cast_fp16 = mul(x = var_275_cast_fp16, y = const_226_to_fp16)[name = string("q_7_cast_fp16")]; tensor var_281 = const()[name = string("op_281"), val = tensor([1, 1500, 20, -1])]; tensor var_282_cast_fp16 = reshape(shape = var_281, x = linear_7_cast_fp16)[name = string("op_282_cast_fp16")]; tensor const_227_to_fp16 = const()[name = string("const_227_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_7_cast_fp16 = mul(x = var_282_cast_fp16, y = const_227_to_fp16)[name = string("k_7_cast_fp16")]; tensor var_288 = const()[name = string("op_288"), val = tensor([1, 1500, 20, -1])]; tensor var_289_cast_fp16 = reshape(shape = var_288, x = linear_8_cast_fp16)[name = string("op_289_cast_fp16")]; tensor var_290 = const()[name = string("op_290"), val = tensor([0, 2, -3, -1])]; bool qk_3_transpose_x_0 = const()[name = string("qk_3_transpose_x_0"), val = bool(false)]; bool qk_3_transpose_y_0 = const()[name = string("qk_3_transpose_y_0"), val = bool(false)]; tensor transpose_66_perm_0 = const()[name = string("transpose_66_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_67_perm_0 = const()[name = string("transpose_67_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_67 = transpose(perm = transpose_67_perm_0, x = k_7_cast_fp16)[name = string("transpose_154")]; tensor transpose_66 = transpose(perm = transpose_66_perm_0, x = q_7_cast_fp16)[name = string("transpose_155")]; tensor qk_3_cast_fp16 = matmul(transpose_x = qk_3_transpose_x_0, transpose_y = qk_3_transpose_y_0, x = transpose_66, y = transpose_67)[name = string("qk_3_cast_fp16")]; tensor var_294_cast_fp16 = softmax(axis = var_230, x = qk_3_cast_fp16)[name = string("op_294_cast_fp16")]; bool var_296_transpose_x_0 = const()[name = string("op_296_transpose_x_0"), val = bool(false)]; bool var_296_transpose_y_0 = const()[name = string("op_296_transpose_y_0"), val = bool(false)]; tensor v_7_cast_fp16 = transpose(perm = var_290, x = var_289_cast_fp16)[name = string("transpose_153")]; tensor var_296_cast_fp16 = matmul(transpose_x = var_296_transpose_x_0, transpose_y = var_296_transpose_y_0, x = var_294_cast_fp16, y = v_7_cast_fp16)[name = string("op_296_cast_fp16")]; tensor var_297 = const()[name = string("op_297"), val = tensor([0, 2, 1, 3])]; tensor concat_1 = const()[name = string("concat_1"), val = tensor([1, 1500, 1280])]; tensor var_298_cast_fp16 = transpose(perm = var_297, x = var_296_cast_fp16)[name = string("transpose_152")]; tensor x_23_cast_fp16 = reshape(shape = concat_1, x = var_298_cast_fp16)[name = string("x_23_cast_fp16")]; tensor var_302_to_fp16 = const()[name = string("op_302_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(63487296)))]; tensor var_303_to_fp16 = const()[name = string("op_303_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(66764160)))]; tensor linear_9_cast_fp16 = linear(bias = var_303_to_fp16, weight = var_302_to_fp16, x = x_23_cast_fp16)[name = string("linear_9_cast_fp16")]; tensor x_25_cast_fp16 = add(x = x_19_cast_fp16, y = linear_9_cast_fp16)[name = string("x_25_cast_fp16")]; tensor var_310_axes_0 = const()[name = string("op_310_axes_0"), val = tensor([-1])]; tensor blocks_1_mlp_ln_weight_to_fp16 = const()[name = string("blocks_1_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(66766784)))]; tensor blocks_1_mlp_ln_bias_to_fp16 = const()[name = string("blocks_1_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(66769408)))]; tensor var_310_cast_fp16 = layer_norm(axes = var_310_axes_0, beta = blocks_1_mlp_ln_bias_to_fp16, epsilon = var_236_to_fp16, gamma = blocks_1_mlp_ln_weight_to_fp16, x = x_25_cast_fp16)[name = string("op_310_cast_fp16")]; tensor var_319_to_fp16 = const()[name = string("op_319_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(66772032)))]; tensor var_320_to_fp16 = const()[name = string("op_320_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(79879296)))]; tensor linear_10_cast_fp16 = linear(bias = var_320_to_fp16, weight = var_319_to_fp16, x = var_310_cast_fp16)[name = string("linear_10_cast_fp16")]; string x_29_mode_0 = const()[name = string("x_29_mode_0"), val = string("EXACT")]; tensor x_29_cast_fp16 = gelu(mode = x_29_mode_0, x = linear_10_cast_fp16)[name = string("x_29_cast_fp16")]; tensor var_325_to_fp16 = const()[name = string("op_325_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(79889600)))]; tensor var_326_to_fp16 = const()[name = string("op_326_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(92996864)))]; tensor linear_11_cast_fp16 = linear(bias = var_326_to_fp16, weight = var_325_to_fp16, x = x_29_cast_fp16)[name = string("linear_11_cast_fp16")]; tensor x_31_cast_fp16 = add(x = x_25_cast_fp16, y = linear_11_cast_fp16)[name = string("x_31_cast_fp16")]; int32 var_336 = const()[name = string("op_336"), val = int32(-1)]; tensor var_352_axes_0 = const()[name = string("op_352_axes_0"), val = tensor([-1])]; tensor blocks_2_attn_ln_weight_to_fp16 = const()[name = string("blocks_2_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(92999488)))]; tensor blocks_2_attn_ln_bias_to_fp16 = const()[name = string("blocks_2_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(93002112)))]; fp16 var_342_to_fp16 = const()[name = string("op_342_to_fp16"), val = fp16(0x1.5p-17)]; tensor var_352_cast_fp16 = layer_norm(axes = var_352_axes_0, beta = blocks_2_attn_ln_bias_to_fp16, epsilon = var_342_to_fp16, gamma = blocks_2_attn_ln_weight_to_fp16, x = x_31_cast_fp16)[name = string("op_352_cast_fp16")]; tensor var_363_to_fp16 = const()[name = string("op_363_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(93004736)))]; tensor var_364_to_fp16 = const()[name = string("op_364_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(96281600)))]; tensor linear_12_cast_fp16 = linear(bias = var_364_to_fp16, weight = var_363_to_fp16, x = var_352_cast_fp16)[name = string("linear_12_cast_fp16")]; tensor var_367_to_fp16 = const()[name = string("op_367_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(96284224)))]; tensor linear_13_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_367_to_fp16, x = var_352_cast_fp16)[name = string("linear_13_cast_fp16")]; tensor var_371_to_fp16 = const()[name = string("op_371_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(99561088)))]; tensor var_372_to_fp16 = const()[name = string("op_372_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(102837952)))]; tensor linear_14_cast_fp16 = linear(bias = var_372_to_fp16, weight = var_371_to_fp16, x = var_352_cast_fp16)[name = string("linear_14_cast_fp16")]; tensor var_380 = const()[name = string("op_380"), val = tensor([1, 1500, 20, -1])]; tensor var_381_cast_fp16 = reshape(shape = var_380, x = linear_12_cast_fp16)[name = string("op_381_cast_fp16")]; tensor const_228_to_fp16 = const()[name = string("const_228_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_11_cast_fp16 = mul(x = var_381_cast_fp16, y = const_228_to_fp16)[name = string("q_11_cast_fp16")]; tensor var_387 = const()[name = string("op_387"), val = tensor([1, 1500, 20, -1])]; tensor var_388_cast_fp16 = reshape(shape = var_387, x = linear_13_cast_fp16)[name = string("op_388_cast_fp16")]; tensor const_229_to_fp16 = const()[name = string("const_229_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_11_cast_fp16 = mul(x = var_388_cast_fp16, y = const_229_to_fp16)[name = string("k_11_cast_fp16")]; tensor var_394 = const()[name = string("op_394"), val = tensor([1, 1500, 20, -1])]; tensor var_395_cast_fp16 = reshape(shape = var_394, x = linear_14_cast_fp16)[name = string("op_395_cast_fp16")]; tensor var_396 = const()[name = string("op_396"), val = tensor([0, 2, -3, -1])]; bool qk_5_transpose_x_0 = const()[name = string("qk_5_transpose_x_0"), val = bool(false)]; bool qk_5_transpose_y_0 = const()[name = string("qk_5_transpose_y_0"), val = bool(false)]; tensor transpose_68_perm_0 = const()[name = string("transpose_68_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_69_perm_0 = const()[name = string("transpose_69_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_69 = transpose(perm = transpose_69_perm_0, x = k_11_cast_fp16)[name = string("transpose_150")]; tensor transpose_68 = transpose(perm = transpose_68_perm_0, x = q_11_cast_fp16)[name = string("transpose_151")]; tensor qk_5_cast_fp16 = matmul(transpose_x = qk_5_transpose_x_0, transpose_y = qk_5_transpose_y_0, x = transpose_68, y = transpose_69)[name = string("qk_5_cast_fp16")]; tensor var_400_cast_fp16 = softmax(axis = var_336, x = qk_5_cast_fp16)[name = string("op_400_cast_fp16")]; bool var_402_transpose_x_0 = const()[name = string("op_402_transpose_x_0"), val = bool(false)]; bool var_402_transpose_y_0 = const()[name = string("op_402_transpose_y_0"), val = bool(false)]; tensor v_11_cast_fp16 = transpose(perm = var_396, x = var_395_cast_fp16)[name = string("transpose_149")]; tensor var_402_cast_fp16 = matmul(transpose_x = var_402_transpose_x_0, transpose_y = var_402_transpose_y_0, x = var_400_cast_fp16, y = v_11_cast_fp16)[name = string("op_402_cast_fp16")]; tensor var_403 = const()[name = string("op_403"), val = tensor([0, 2, 1, 3])]; tensor concat_2 = const()[name = string("concat_2"), val = tensor([1, 1500, 1280])]; tensor var_404_cast_fp16 = transpose(perm = var_403, x = var_402_cast_fp16)[name = string("transpose_148")]; tensor x_35_cast_fp16 = reshape(shape = concat_2, x = var_404_cast_fp16)[name = string("x_35_cast_fp16")]; tensor var_408_to_fp16 = const()[name = string("op_408_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(102840576)))]; tensor var_409_to_fp16 = const()[name = string("op_409_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(106117440)))]; tensor linear_15_cast_fp16 = linear(bias = var_409_to_fp16, weight = var_408_to_fp16, x = x_35_cast_fp16)[name = string("linear_15_cast_fp16")]; tensor x_37_cast_fp16 = add(x = x_31_cast_fp16, y = linear_15_cast_fp16)[name = string("x_37_cast_fp16")]; tensor var_416_axes_0 = const()[name = string("op_416_axes_0"), val = tensor([-1])]; tensor blocks_2_mlp_ln_weight_to_fp16 = const()[name = string("blocks_2_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(106120064)))]; tensor blocks_2_mlp_ln_bias_to_fp16 = const()[name = string("blocks_2_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(106122688)))]; tensor var_416_cast_fp16 = layer_norm(axes = var_416_axes_0, beta = blocks_2_mlp_ln_bias_to_fp16, epsilon = var_342_to_fp16, gamma = blocks_2_mlp_ln_weight_to_fp16, x = x_37_cast_fp16)[name = string("op_416_cast_fp16")]; tensor var_425_to_fp16 = const()[name = string("op_425_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(106125312)))]; tensor var_426_to_fp16 = const()[name = string("op_426_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(119232576)))]; tensor linear_16_cast_fp16 = linear(bias = var_426_to_fp16, weight = var_425_to_fp16, x = var_416_cast_fp16)[name = string("linear_16_cast_fp16")]; string x_41_mode_0 = const()[name = string("x_41_mode_0"), val = string("EXACT")]; tensor x_41_cast_fp16 = gelu(mode = x_41_mode_0, x = linear_16_cast_fp16)[name = string("x_41_cast_fp16")]; tensor var_431_to_fp16 = const()[name = string("op_431_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(119242880)))]; tensor var_432_to_fp16 = const()[name = string("op_432_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(132350144)))]; tensor linear_17_cast_fp16 = linear(bias = var_432_to_fp16, weight = var_431_to_fp16, x = x_41_cast_fp16)[name = string("linear_17_cast_fp16")]; tensor x_43_cast_fp16 = add(x = x_37_cast_fp16, y = linear_17_cast_fp16)[name = string("x_43_cast_fp16")]; int32 var_442 = const()[name = string("op_442"), val = int32(-1)]; tensor var_458_axes_0 = const()[name = string("op_458_axes_0"), val = tensor([-1])]; tensor blocks_3_attn_ln_weight_to_fp16 = const()[name = string("blocks_3_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(132352768)))]; tensor blocks_3_attn_ln_bias_to_fp16 = const()[name = string("blocks_3_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(132355392)))]; fp16 var_448_to_fp16 = const()[name = string("op_448_to_fp16"), val = fp16(0x1.5p-17)]; tensor var_458_cast_fp16 = layer_norm(axes = var_458_axes_0, beta = blocks_3_attn_ln_bias_to_fp16, epsilon = var_448_to_fp16, gamma = blocks_3_attn_ln_weight_to_fp16, x = x_43_cast_fp16)[name = string("op_458_cast_fp16")]; tensor var_469_to_fp16 = const()[name = string("op_469_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(132358016)))]; tensor var_470_to_fp16 = const()[name = string("op_470_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(135634880)))]; tensor linear_18_cast_fp16 = linear(bias = var_470_to_fp16, weight = var_469_to_fp16, x = var_458_cast_fp16)[name = string("linear_18_cast_fp16")]; tensor var_473_to_fp16 = const()[name = string("op_473_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(135637504)))]; tensor linear_19_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_473_to_fp16, x = var_458_cast_fp16)[name = string("linear_19_cast_fp16")]; tensor var_477_to_fp16 = const()[name = string("op_477_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(138914368)))]; tensor var_478_to_fp16 = const()[name = string("op_478_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(142191232)))]; tensor linear_20_cast_fp16 = linear(bias = var_478_to_fp16, weight = var_477_to_fp16, x = var_458_cast_fp16)[name = string("linear_20_cast_fp16")]; tensor var_486 = const()[name = string("op_486"), val = tensor([1, 1500, 20, -1])]; tensor var_487_cast_fp16 = reshape(shape = var_486, x = linear_18_cast_fp16)[name = string("op_487_cast_fp16")]; tensor const_230_to_fp16 = const()[name = string("const_230_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_15_cast_fp16 = mul(x = var_487_cast_fp16, y = const_230_to_fp16)[name = string("q_15_cast_fp16")]; tensor var_493 = const()[name = string("op_493"), val = tensor([1, 1500, 20, -1])]; tensor var_494_cast_fp16 = reshape(shape = var_493, x = linear_19_cast_fp16)[name = string("op_494_cast_fp16")]; tensor const_231_to_fp16 = const()[name = string("const_231_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_15_cast_fp16 = mul(x = var_494_cast_fp16, y = const_231_to_fp16)[name = string("k_15_cast_fp16")]; tensor var_500 = const()[name = string("op_500"), val = tensor([1, 1500, 20, -1])]; tensor var_501_cast_fp16 = reshape(shape = var_500, x = linear_20_cast_fp16)[name = string("op_501_cast_fp16")]; tensor var_502 = const()[name = string("op_502"), val = tensor([0, 2, -3, -1])]; bool qk_7_transpose_x_0 = const()[name = string("qk_7_transpose_x_0"), val = bool(false)]; bool qk_7_transpose_y_0 = const()[name = string("qk_7_transpose_y_0"), val = bool(false)]; tensor transpose_70_perm_0 = const()[name = string("transpose_70_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_71_perm_0 = const()[name = string("transpose_71_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_71 = transpose(perm = transpose_71_perm_0, x = k_15_cast_fp16)[name = string("transpose_146")]; tensor transpose_70 = transpose(perm = transpose_70_perm_0, x = q_15_cast_fp16)[name = string("transpose_147")]; tensor qk_7_cast_fp16 = matmul(transpose_x = qk_7_transpose_x_0, transpose_y = qk_7_transpose_y_0, x = transpose_70, y = transpose_71)[name = string("qk_7_cast_fp16")]; tensor var_506_cast_fp16 = softmax(axis = var_442, x = qk_7_cast_fp16)[name = string("op_506_cast_fp16")]; bool var_508_transpose_x_0 = const()[name = string("op_508_transpose_x_0"), val = bool(false)]; bool var_508_transpose_y_0 = const()[name = string("op_508_transpose_y_0"), val = bool(false)]; tensor v_15_cast_fp16 = transpose(perm = var_502, x = var_501_cast_fp16)[name = string("transpose_145")]; tensor var_508_cast_fp16 = matmul(transpose_x = var_508_transpose_x_0, transpose_y = var_508_transpose_y_0, x = var_506_cast_fp16, y = v_15_cast_fp16)[name = string("op_508_cast_fp16")]; tensor var_509 = const()[name = string("op_509"), val = tensor([0, 2, 1, 3])]; tensor concat_3 = const()[name = string("concat_3"), val = tensor([1, 1500, 1280])]; tensor var_510_cast_fp16 = transpose(perm = var_509, x = var_508_cast_fp16)[name = string("transpose_144")]; tensor x_47_cast_fp16 = reshape(shape = concat_3, x = var_510_cast_fp16)[name = string("x_47_cast_fp16")]; tensor var_514_to_fp16 = const()[name = string("op_514_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(142193856)))]; tensor var_515_to_fp16 = const()[name = string("op_515_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(145470720)))]; tensor linear_21_cast_fp16 = linear(bias = var_515_to_fp16, weight = var_514_to_fp16, x = x_47_cast_fp16)[name = string("linear_21_cast_fp16")]; tensor x_49_cast_fp16 = add(x = x_43_cast_fp16, y = linear_21_cast_fp16)[name = string("x_49_cast_fp16")]; tensor var_522_axes_0 = const()[name = string("op_522_axes_0"), val = tensor([-1])]; tensor blocks_3_mlp_ln_weight_to_fp16 = const()[name = string("blocks_3_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(145473344)))]; tensor blocks_3_mlp_ln_bias_to_fp16 = const()[name = string("blocks_3_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(145475968)))]; tensor var_522_cast_fp16 = layer_norm(axes = var_522_axes_0, beta = blocks_3_mlp_ln_bias_to_fp16, epsilon = var_448_to_fp16, gamma = blocks_3_mlp_ln_weight_to_fp16, x = x_49_cast_fp16)[name = string("op_522_cast_fp16")]; tensor var_531_to_fp16 = const()[name = string("op_531_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(145478592)))]; tensor var_532_to_fp16 = const()[name = string("op_532_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(158585856)))]; tensor linear_22_cast_fp16 = linear(bias = var_532_to_fp16, weight = var_531_to_fp16, x = var_522_cast_fp16)[name = string("linear_22_cast_fp16")]; string x_53_mode_0 = const()[name = string("x_53_mode_0"), val = string("EXACT")]; tensor x_53_cast_fp16 = gelu(mode = x_53_mode_0, x = linear_22_cast_fp16)[name = string("x_53_cast_fp16")]; tensor var_537_to_fp16 = const()[name = string("op_537_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(158596160)))]; tensor var_538_to_fp16 = const()[name = string("op_538_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(171703424)))]; tensor linear_23_cast_fp16 = linear(bias = var_538_to_fp16, weight = var_537_to_fp16, x = x_53_cast_fp16)[name = string("linear_23_cast_fp16")]; tensor x_55_cast_fp16 = add(x = x_49_cast_fp16, y = linear_23_cast_fp16)[name = string("x_55_cast_fp16")]; int32 var_548 = const()[name = string("op_548"), val = int32(-1)]; tensor var_564_axes_0 = const()[name = string("op_564_axes_0"), val = tensor([-1])]; tensor blocks_4_attn_ln_weight_to_fp16 = const()[name = string("blocks_4_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(171706048)))]; tensor blocks_4_attn_ln_bias_to_fp16 = const()[name = string("blocks_4_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(171708672)))]; fp16 var_554_to_fp16 = const()[name = string("op_554_to_fp16"), val = fp16(0x1.5p-17)]; tensor var_564_cast_fp16 = layer_norm(axes = var_564_axes_0, beta = blocks_4_attn_ln_bias_to_fp16, epsilon = var_554_to_fp16, gamma = blocks_4_attn_ln_weight_to_fp16, x = x_55_cast_fp16)[name = string("op_564_cast_fp16")]; tensor var_575_to_fp16 = const()[name = string("op_575_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(171711296)))]; tensor var_576_to_fp16 = const()[name = string("op_576_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(174988160)))]; tensor linear_24_cast_fp16 = linear(bias = var_576_to_fp16, weight = var_575_to_fp16, x = var_564_cast_fp16)[name = string("linear_24_cast_fp16")]; tensor var_579_to_fp16 = const()[name = string("op_579_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(174990784)))]; tensor linear_25_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_579_to_fp16, x = var_564_cast_fp16)[name = string("linear_25_cast_fp16")]; tensor var_583_to_fp16 = const()[name = string("op_583_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(178267648)))]; tensor var_584_to_fp16 = const()[name = string("op_584_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/0-weight.bin"), offset = uint64(181544512)))]; tensor linear_26_cast_fp16 = linear(bias = var_584_to_fp16, weight = var_583_to_fp16, x = var_564_cast_fp16)[name = string("linear_26_cast_fp16")]; tensor var_592 = const()[name = string("op_592"), val = tensor([1, 1500, 20, -1])]; tensor var_593_cast_fp16 = reshape(shape = var_592, x = linear_24_cast_fp16)[name = string("op_593_cast_fp16")]; tensor const_232_to_fp16 = const()[name = string("const_232_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_19_cast_fp16 = mul(x = var_593_cast_fp16, y = const_232_to_fp16)[name = string("q_19_cast_fp16")]; tensor var_599 = const()[name = string("op_599"), val = tensor([1, 1500, 20, -1])]; tensor var_600_cast_fp16 = reshape(shape = var_599, x = linear_25_cast_fp16)[name = string("op_600_cast_fp16")]; tensor const_233_to_fp16 = const()[name = string("const_233_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_19_cast_fp16 = mul(x = var_600_cast_fp16, y = const_233_to_fp16)[name = string("k_19_cast_fp16")]; tensor var_606 = const()[name = string("op_606"), val = tensor([1, 1500, 20, -1])]; tensor var_607_cast_fp16 = reshape(shape = var_606, x = linear_26_cast_fp16)[name = string("op_607_cast_fp16")]; tensor var_608 = const()[name = string("op_608"), val = tensor([0, 2, -3, -1])]; bool qk_9_transpose_x_0 = const()[name = string("qk_9_transpose_x_0"), val = bool(false)]; bool qk_9_transpose_y_0 = const()[name = string("qk_9_transpose_y_0"), val = bool(false)]; tensor transpose_72_perm_0 = const()[name = string("transpose_72_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_73_perm_0 = const()[name = string("transpose_73_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_73 = transpose(perm = transpose_73_perm_0, x = k_19_cast_fp16)[name = string("transpose_142")]; tensor transpose_72 = transpose(perm = transpose_72_perm_0, x = q_19_cast_fp16)[name = string("transpose_143")]; tensor qk_9_cast_fp16 = matmul(transpose_x = qk_9_transpose_x_0, transpose_y = qk_9_transpose_y_0, x = transpose_72, y = transpose_73)[name = string("qk_9_cast_fp16")]; tensor var_612_cast_fp16 = softmax(axis = var_548, x = qk_9_cast_fp16)[name = string("op_612_cast_fp16")]; bool var_614_transpose_x_0 = const()[name = string("op_614_transpose_x_0"), val = bool(false)]; bool var_614_transpose_y_0 = const()[name = string("op_614_transpose_y_0"), val = bool(false)]; tensor v_19_cast_fp16 = transpose(perm = var_608, x = var_607_cast_fp16)[name = string("transpose_141")]; tensor var_614_cast_fp16 = matmul(transpose_x = var_614_transpose_x_0, transpose_y = var_614_transpose_y_0, x = var_612_cast_fp16, y = v_19_cast_fp16)[name = string("op_614_cast_fp16")]; tensor var_615 = const()[name = string("op_615"), val = tensor([0, 2, 1, 3])]; tensor concat_4 = const()[name = string("concat_4"), val = tensor([1, 1500, 1280])]; tensor var_616_cast_fp16 = transpose(perm = var_615, x = var_614_cast_fp16)[name = string("transpose_140")]; tensor x_59_cast_fp16 = reshape(shape = concat_4, x = var_616_cast_fp16)[name = string("x_59_cast_fp16")]; tensor