program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3510.2.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.7.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})] { func main(tensor decoder_input_ids, tensor encoder_attention_mask, tensor encoder_hidden_states) [FlexibleShapeInformation = tuple, dict, tensor>>, tuple, dict, list, ?>>>>((("DefaultShapes", {{"decoder_input_ids", [1, 8]}, {"encoder_attention_mask", [1, 16]}, {"encoder_hidden_states", [1, 16, 256]}}), ("RangeDims", {{"decoder_input_ids", [[1, 1], [1, 128]]}, {"encoder_attention_mask", [[1, 1], [1, 64]]}, {"encoder_hidden_states", [[1, 1], [1, 64], [256, 256]]}})))] { tensor decoder_embed_tokens_weight = const()[name = tensor("decoder_embed_tokens_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor decoder_block_0_layer_0_layer_norm_weight = const()[name = tensor("decoder_block_0_layer_0_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(393344)))]; tensor decoder_block_0_layer_0_SelfAttention_q_weight = const()[name = tensor("decoder_block_0_layer_0_SelfAttention_q_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394432)))]; tensor decoder_block_0_layer_0_SelfAttention_k_weight = const()[name = tensor("decoder_block_0_layer_0_SelfAttention_k_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(787712)))]; tensor decoder_block_0_layer_0_SelfAttention_v_weight = const()[name = tensor("decoder_block_0_layer_0_SelfAttention_v_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1180992)))]; tensor decoder_block_0_layer_0_SelfAttention_relative_attention_bias_weight = const()[name = tensor("decoder_block_0_layer_0_SelfAttention_relative_attention_bias_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1574272)))]; tensor decoder_block_0_layer_0_SelfAttention_o_weight = const()[name = tensor("decoder_block_0_layer_0_SelfAttention_o_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1575104)))]; tensor decoder_block_0_layer_1_layer_norm_weight = const()[name = tensor("decoder_block_0_layer_1_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1968384)))]; tensor decoder_block_0_layer_1_EncDecAttention_q_weight = const()[name = tensor("decoder_block_0_layer_1_EncDecAttention_q_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1969472)))]; tensor decoder_block_0_layer_1_EncDecAttention_k_weight = const()[name = tensor("decoder_block_0_layer_1_EncDecAttention_k_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2362752)))]; tensor decoder_block_0_layer_1_EncDecAttention_v_weight = const()[name = tensor("decoder_block_0_layer_1_EncDecAttention_v_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2756032)))]; tensor decoder_block_0_layer_1_EncDecAttention_o_weight = const()[name = tensor("decoder_block_0_layer_1_EncDecAttention_o_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3149312)))]; tensor decoder_block_0_layer_2_layer_norm_weight = const()[name = tensor("decoder_block_0_layer_2_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3542592)))]; tensor decoder_block_0_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor("decoder_block_0_layer_2_DenseReluDense_wi_0_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3543680)))]; tensor decoder_block_0_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor("decoder_block_0_layer_2_DenseReluDense_wi_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4592320)))]; tensor decoder_block_0_layer_2_DenseReluDense_wo_weight = const()[name = tensor("decoder_block_0_layer_2_DenseReluDense_wo_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5640960)))]; tensor decoder_block_1_layer_0_layer_norm_weight = const()[name = tensor("decoder_block_1_layer_0_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6689600)))]; tensor decoder_block_1_layer_0_SelfAttention_q_weight = const()[name = tensor("decoder_block_1_layer_0_SelfAttention_q_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6690688)))]; tensor decoder_block_1_layer_0_SelfAttention_k_weight = const()[name = tensor("decoder_block_1_layer_0_SelfAttention_k_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7083968)))]; tensor decoder_block_1_layer_0_SelfAttention_v_weight = const()[name = tensor("decoder_block_1_layer_0_SelfAttention_v_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7477248)))]; tensor decoder_block_1_layer_0_SelfAttention_o_weight = const()[name = tensor("decoder_block_1_layer_0_SelfAttention_o_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7870528)))]; tensor decoder_block_1_layer_1_layer_norm_weight = const()[name = tensor("decoder_block_1_layer_1_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8263808)))]; tensor decoder_block_1_layer_1_EncDecAttention_q_weight = const()[name = tensor("decoder_block_1_layer_1_EncDecAttention_q_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8264896)))]; tensor decoder_block_1_layer_1_EncDecAttention_k_weight = const()[name = tensor("decoder_block_1_layer_1_EncDecAttention_k_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8658176)))]; tensor decoder_block_1_layer_1_EncDecAttention_v_weight = const()[name = tensor("decoder_block_1_layer_1_EncDecAttention_v_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9051456)))]; tensor decoder_block_1_layer_1_EncDecAttention_o_weight = const()[name = tensor("decoder_block_1_layer_1_EncDecAttention_o_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9444736)))]; tensor decoder_block_1_layer_2_layer_norm_weight = const()[name = tensor("decoder_block_1_layer_2_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9838016)))]; tensor decoder_block_1_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor("decoder_block_1_layer_2_DenseReluDense_wi_0_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9839104)))]; tensor decoder_block_1_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor("decoder_block_1_layer_2_DenseReluDense_wi_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10887744)))]; tensor decoder_block_1_layer_2_DenseReluDense_wo_weight = const()[name = tensor("decoder_block_1_layer_2_DenseReluDense_wo_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11936384)))]; tensor decoder_block_2_layer_0_layer_norm_weight = const()[name = tensor("decoder_block_2_layer_0_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12985024)))]; tensor decoder_block_2_layer_0_SelfAttention_q_weight = const()[name = tensor("decoder_block_2_layer_0_SelfAttention_q_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12986112)))]; tensor decoder_block_2_layer_0_SelfAttention_k_weight = const()[name = tensor("decoder_block_2_layer_0_SelfAttention_k_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13379392)))]; tensor decoder_block_2_layer_0_SelfAttention_v_weight = const()[name = tensor("decoder_block_2_layer_0_SelfAttention_v_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13772672)))]; tensor decoder_block_2_layer_0_SelfAttention_o_weight = const()[name = tensor("decoder_block_2_layer_0_SelfAttention_o_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14165952)))]; tensor decoder_block_2_layer_1_layer_norm_weight = const()[name = tensor("decoder_block_2_layer_1_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14559232)))]; tensor decoder_block_2_layer_1_EncDecAttention_q_weight = const()[name = tensor("decoder_block_2_layer_1_EncDecAttention_q_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14560320)))]; tensor decoder_block_2_layer_1_EncDecAttention_k_weight = const()[name = tensor("decoder_block_2_layer_1_EncDecAttention_k_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14953600)))]; tensor decoder_block_2_layer_1_EncDecAttention_v_weight = const()[name = tensor("decoder_block_2_layer_1_EncDecAttention_v_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15346880)))]; tensor decoder_block_2_layer_1_EncDecAttention_o_weight = const()[name = tensor("decoder_block_2_layer_1_EncDecAttention_o_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15740160)))]; tensor decoder_block_2_layer_2_layer_norm_weight = const()[name = tensor("decoder_block_2_layer_2_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16133440)))]; tensor decoder_block_2_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor("decoder_block_2_layer_2_DenseReluDense_wi_0_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16134528)))]; tensor decoder_block_2_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor("decoder_block_2_layer_2_DenseReluDense_wi_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17183168)))]; tensor decoder_block_2_layer_2_DenseReluDense_wo_weight = const()[name = tensor("decoder_block_2_layer_2_DenseReluDense_wo_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18231808)))]; tensor decoder_block_3_layer_0_layer_norm_weight = const()[name = tensor("decoder_block_3_layer_0_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19280448)))]; tensor decoder_block_3_layer_0_SelfAttention_q_weight = const()[name = tensor("decoder_block_3_layer_0_SelfAttention_q_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19281536)))]; tensor decoder_block_3_layer_0_SelfAttention_k_weight = const()[name = tensor("decoder_block_3_layer_0_SelfAttention_k_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19674816)))]; tensor decoder_block_3_layer_0_SelfAttention_v_weight = const()[name = tensor("decoder_block_3_layer_0_SelfAttention_v_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20068096)))]; tensor decoder_block_3_layer_0_SelfAttention_o_weight = const()[name = tensor("decoder_block_3_layer_0_SelfAttention_o_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20461376)))]; tensor decoder_block_3_layer_1_layer_norm_weight = const()[name = tensor("decoder_block_3_layer_1_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20854656)))]; tensor decoder_block_3_layer_1_EncDecAttention_q_weight = const()[name = tensor("decoder_block_3_layer_1_EncDecAttention_q_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20855744)))]; tensor decoder_block_3_layer_1_EncDecAttention_k_weight = const()[name = tensor("decoder_block_3_layer_1_EncDecAttention_k_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21249024)))]; tensor decoder_block_3_layer_1_EncDecAttention_v_weight = const()[name = tensor("decoder_block_3_layer_1_EncDecAttention_v_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21642304)))]; tensor decoder_block_3_layer_1_EncDecAttention_o_weight = const()[name = tensor("decoder_block_3_layer_1_EncDecAttention_o_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22035584)))]; tensor decoder_block_3_layer_2_layer_norm_weight = const()[name = tensor("decoder_block_3_layer_2_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22428864)))]; tensor decoder_block_3_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor("decoder_block_3_layer_2_DenseReluDense_wi_0_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22429952)))]; tensor decoder_block_3_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor("decoder_block_3_layer_2_DenseReluDense_wi_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23478592)))]; tensor decoder_block_3_layer_2_DenseReluDense_wo_weight = const()[name = tensor("decoder_block_3_layer_2_DenseReluDense_wo_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24527232)))]; tensor decoder_final_layer_norm_weight = const()[name = tensor("decoder_final_layer_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25575872)))]; tensor lm_head_weight = const()[name = tensor("lm_head_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25576960)))]; tensor var_8 = const()[name = tensor("op_8"), val = tensor(16)]; tensor var_14 = const()[name = tensor("op_14"), val = tensor(0x1p+0)]; tensor var_16 = const()[name = tensor("op_16"), val = tensor(6)]; tensor var_22 = const()[name = tensor("op_22"), val = tensor(-1)]; tensor var_23 = const()[name = tensor("op_23"), val = tensor(1)]; tensor var_35_shape = shape(x = decoder_input_ids)[name = tensor("op_35_shape")]; tensor gather_0 = const()[name = tensor("gather_0"), val = tensor(1)]; tensor gather_1_batch_dims_0 = const()[name = tensor("gather_1_batch_dims_0"), val = tensor(0)]; tensor gather_1_validate_indices_0 = const()[name = tensor("gather_1_validate_indices_0"), val = tensor(false)]; tensor select_0 = const()[name = tensor("select_0"), val = tensor(1)]; tensor gather_1_axis_1 = const()[name = tensor("gather_1_axis_1"), val = tensor(0)]; tensor gather_1 = gather(axis = gather_1_axis_1, batch_dims = gather_1_batch_dims_0, indices = select_0, validate_indices = gather_1_validate_indices_0, x = var_35_shape)[name = tensor("gather_1")]; tensor input_3_batch_dims_0 = const()[name = tensor("input_3_batch_dims_0"), val = tensor(0)]; tensor input_3_validate_indices_0 = const()[name = tensor("input_3_validate_indices_0"), val = tensor(false)]; tensor greater_equal_1_y_0 = const()[name = tensor("greater_equal_1_y_0"), val = tensor(0)]; tensor greater_equal_1 = greater_equal(x = decoder_input_ids, y = greater_equal_1_y_0)[name = tensor("greater_equal_1")]; tensor slice_by_index_1 = const()[name = tensor("slice_by_index_1"), val = tensor(384)]; tensor add_1 = add(x = decoder_input_ids, y = slice_by_index_1)[name = tensor("add_1")]; tensor select_1 = select(a = decoder_input_ids, b = add_1, cond = greater_equal_1)[name = tensor("select_1")]; tensor input_3_axis_1 = const()[name = tensor("input_3_axis_1"), val = tensor(0)]; tensor input_3 = gather(axis = input_3_axis_1, batch_dims = input_3_batch_dims_0, indices = select_1, validate_indices = input_3_validate_indices_0, x = decoder_embed_tokens_weight)[name = tensor("input_3")]; tensor concat_1_axis_0 = const()[name = tensor("concat_1_axis_0"), val = tensor(0)]; tensor concat_1_interleave_0 = const()[name = tensor("concat_1_interleave_0"), val = tensor(false)]; tensor concat_1 = concat(axis = concat_1_axis_0, interleave = concat_1_interleave_0, values = (gather_0, gather_1))[name = tensor("concat_1")]; tensor fill_0_value_0 = const()[name = tensor("fill_0_value_0"), val = tensor(0x1p+0)]; tensor fill_0 = fill(shape = concat_1, value = fill_0_value_0)[name = tensor("fill_0")]; tensor const_0 = const()[name = tensor("const_0"), val = tensor(0)]; tensor const_1 = const()[name = tensor("const_1"), val = tensor(1)]; tensor seq_ids = range_1d(end = gather_1, start = const_0, step = const_1)[name = tensor("seq_ids")]; tensor var_44_axes_0 = const()[name = tensor("op_44_axes_0"), val = tensor([0])]; tensor var_44 = expand_dims(axes = var_44_axes_0, x = seq_ids)[name = tensor("op_44")]; tensor var_45_axes_0 = const()[name = tensor("op_45_axes_0"), val = tensor([1])]; tensor var_45 = expand_dims(axes = var_45_axes_0, x = var_44)[name = tensor("op_45")]; tensor