| program(1.0) |
| [buildInfo = dict<tensor<string, []>, tensor<string, []>>({{"coremlc-component-MIL", "3520.4.1"}, {"coremlc-version", "3520.5.1"}, {"coremltools-component-torch", "2.9.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})] |
| { |
| func main<ios17>(tensor<int32, [1, 256]> attention_mask, tensor<int32, [1, 256]> input_ids) { |
| tensor<int32, []> var_16 = const()[name = tensor<string, []>("op_16"), val = tensor<int32, []>(0)]; |
| tensor<int32, []> var_18 = const()[name = tensor<string, []>("op_18"), val = tensor<int32, []>(-1)]; |
| tensor<int32, []> var_19 = const()[name = tensor<string, []>("op_19"), val = tensor<int32, []>(1)]; |
| tensor<int32, []> var_55_batch_dims_0 = const()[name = tensor<string, []>("op_55_batch_dims_0"), val = tensor<int32, []>(0)]; |
| tensor<bool, []> var_55_validate_indices_0 = const()[name = tensor<string, []>("op_55_validate_indices_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [256206, 1024]> encoder_embed_tokens_weight_to_fp16 = const()[name = tensor<string, []>("encoder_embed_tokens_weight_to_fp16"), val = tensor<fp16, [256206, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(64)))]; |
| tensor<int32, []> greater_equal_0_y_0 = const()[name = tensor<string, []>("greater_equal_0_y_0"), val = tensor<int32, []>(0)]; |
| tensor<bool, [1, 256]> greater_equal_0 = greater_equal(x = input_ids, y = greater_equal_0_y_0)[name = tensor<string, []>("greater_equal_0")]; |
| tensor<int32, []> slice_by_index_0 = const()[name = tensor<string, []>("slice_by_index_0"), val = tensor<int32, []>(256206)]; |
| tensor<int32, [1, 256]> add_0 = add(x = input_ids, y = slice_by_index_0)[name = tensor<string, []>("add_0")]; |
| tensor<int32, [1, 256]> select_0 = select(a = input_ids, b = add_0, cond = greater_equal_0)[name = tensor<string, []>("select_0")]; |
| tensor<int32, []> var_55_cast_fp16_axis_0 = const()[name = tensor<string, []>("op_55_cast_fp16_axis_0"), val = tensor<int32, []>(0)]; |
| tensor<fp16, [1, 256, 1024]> var_55_cast_fp16 = gather(axis = var_55_cast_fp16_axis_0, batch_dims = var_55_batch_dims_0, indices = select_0, validate_indices = var_55_validate_indices_0, x = encoder_embed_tokens_weight_to_fp16)[name = tensor<string, []>("op_55_cast_fp16")]; |
| tensor<fp16, []> var_56_to_fp16 = const()[name = tensor<string, []>("op_56_to_fp16"), val = tensor<fp16, []>(0x1p+5)]; |
| tensor<fp16, [1, 256, 1024]> inputs_embeds_1_cast_fp16 = mul(x = var_55_cast_fp16, y = var_56_to_fp16)[name = tensor<string, []>("inputs_embeds_1_cast_fp16")]; |
| tensor<bool, [1, 256]> var_61 = not_equal(x = input_ids, y = var_19)[name = tensor<string, []>("op_61")]; |
| tensor<string, []> mask_1_dtype_0 = const()[name = tensor<string, []>("mask_1_dtype_0"), val = tensor<string, []>("int32")]; |
| tensor<bool, []> var_63_exclusive_0 = const()[name = tensor<string, []>("op_63_exclusive_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_63_reverse_0 = const()[name = tensor<string, []>("op_63_reverse_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [1, 256]> mask_1 = cast(dtype = mask_1_dtype_0, x = var_61)[name = tensor<string, []>("cast_56")]; |
| tensor<int32, [1, 256]> var_63 = cumsum(axis = var_19, exclusive = var_63_exclusive_0, reverse = var_63_reverse_0, x = mask_1)[name = tensor<string, []>("op_63")]; |
| tensor<int32, [1, 256]> incremental_indices_1 = mul(x = var_63, y = mask_1)[name = tensor<string, []>("incremental_indices_1")]; |
| tensor<int32, []> var_69 = const()[name = tensor<string, []>("op_69"), val = tensor<int32, []>(1)]; |
| tensor<int32, [1, 256]> var_70 = add(x = incremental_indices_1, y = var_69)[name = tensor<string, []>("op_70")]; |
| tensor<int32, [1]> var_72 = const()[name = tensor<string, []>("op_72"), val = tensor<int32, [1]>([-1])]; |
| tensor<int32, [256]> var_73 = reshape(shape = var_72, x = var_70)[name = tensor<string, []>("op_73")]; |
| tensor<int32, []> var_74_batch_dims_0 = const()[name = tensor<string, []>("op_74_batch_dims_0"), val = tensor<int32, []>(0)]; |
| tensor<bool, []> var_74_validate_indices_0 = const()[name = tensor<string, []>("op_74_validate_indices_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1026, 1024]> encoder_embed_positions_weights_to_fp16 = const()[name = tensor<string, []>("encoder_embed_positions_weights_to_fp16"), val = tensor<fp16, [1026, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(524710016)))]; |
| tensor<string, []> var_73_to_uint16_dtype_0 = const()[name = tensor<string, []>("op_73_to_uint16_dtype_0"), val = tensor<string, []>("uint16")]; |
| tensor<uint16, [256]> var_73_to_uint16 = cast(dtype = var_73_to_uint16_dtype_0, x = var_73)[name = tensor<string, []>("cast_55")]; |
| tensor<fp16, [256, 1024]> var_74_cast_fp16_cast_uint16 = gather(axis = var_16, batch_dims = var_74_batch_dims_0, indices = var_73_to_uint16, validate_indices = var_74_validate_indices_0, x = encoder_embed_positions_weights_to_fp16)[name = tensor<string, []>("op_74_cast_fp16_cast_uint16")]; |
| tensor<int32, [3]> var_76 = const()[name = tensor<string, []>("op_76"), val = tensor<int32, [3]>([1, 256, 1024])]; |
| tensor<fp16, [1, 256, 1024]> var_77_cast_fp16 = reshape(shape = var_76, x = var_74_cast_fp16_cast_uint16)[name = tensor<string, []>("op_77_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input0_7_cast_fp16 = add(x = inputs_embeds_1_cast_fp16, y = var_77_cast_fp16)[name = tensor<string, []>("input0_7_cast_fp16")]; |
| tensor<int32, [1]> var_85_axes_0 = const()[name = tensor<string, []>("op_85_axes_0"), val = tensor<int32, [1]>([1])]; |
| tensor<int32, [1, 1, 256]> var_85 = expand_dims(axes = var_85_axes_0, x = attention_mask)[name = tensor<string, []>("op_85")]; |
| tensor<int32, [1]> var_86_axes_0 = const()[name = tensor<string, []>("op_86_axes_0"), val = tensor<int32, [1]>([2])]; |
| tensor<int32, [1, 1, 1, 256]> var_86 = expand_dims(axes = var_86_axes_0, x = var_85)[name = tensor<string, []>("op_86")]; |
| tensor<int32, [4]> var_89_reps_0 = const()[name = tensor<string, []>("op_89_reps_0"), val = tensor<int32, [4]>([1, 1, 256, 1])]; |
| tensor<int32, [1, 1, 256, 256]> var_89 = tile(reps = var_89_reps_0, x = var_86)[name = tensor<string, []>("op_89")]; |
| tensor<fp16, []> const_6_to_fp16 = const()[name = tensor<string, []>("const_6_to_fp16"), val = tensor<fp16, []>(0x1p+0)]; |
| tensor<string, []> expanded_mask_1_to_fp16_dtype_0 = const()[name = tensor<string, []>("expanded_mask_1_to_fp16_dtype_0"), val = tensor<string, []>("fp16")]; |
| tensor<fp16, [1, 1, 256, 256]> var_89_to_fp16 = cast(dtype = expanded_mask_1_to_fp16_dtype_0, x = var_89)[name = tensor<string, []>("cast_54")]; |
| tensor<fp16, [1, 1, 256, 256]> inverted_mask_1_cast_fp16 = sub(x = const_6_to_fp16, y = var_89_to_fp16)[name = tensor<string, []>("inverted_mask_1_cast_fp16")]; |
| tensor<string, []> var_94_dtype_0 = const()[name = tensor<string, []>("op_94_dtype_0"), val = tensor<string, []>("bool")]; |
| tensor<fp16, []> var_10_to_fp16 = const()[name = tensor<string, []>("op_10_to_fp16"), val = tensor<fp16, []>(-inf)]; |
| tensor<bool, [1, 1, 256, 256]> inverted_mask_1_cast_fp16_to_bool = cast(dtype = var_94_dtype_0, x = inverted_mask_1_cast_fp16)[name = tensor<string, []>("cast_53")]; |
| tensor<fp16, [1, 1, 256, 256]> attention_mask0_1_cast_fp16 = select(a = var_10_to_fp16, b = inverted_mask_1_cast_fp16, cond = inverted_mask_1_cast_fp16_to_bool)[name = tensor<string, []>("attention_mask0_1_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_3_axes_0 = const()[name = tensor<string, []>("hidden_states_3_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_0_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(526811328)))]; |
| tensor<fp16, [1024]> encoder_layers_0_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(526813440)))]; |
| tensor<fp16, []> var_6_to_fp16 = const()[name = tensor<string, []>("op_6_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_3_cast_fp16 = layer_norm(axes = hidden_states_3_axes_0, beta = encoder_layers_0_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_0_self_attn_layer_norm_weight_to_fp16, x = input0_7_cast_fp16)[name = tensor<string, []>("hidden_states_3_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_0_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(526815552)))]; |
| tensor<fp16, [1024]> encoder_layers_0_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(528912768)))]; |
| tensor<fp16, [1, 256, 1024]> linear_0_cast_fp16 = linear(bias = encoder_layers_0_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_q_proj_weight_to_fp16, x = hidden_states_3_cast_fp16)[name = tensor<string, []>("linear_0_cast_fp16")]; |
| tensor<int32, [4]> var_114 = const()[name = tensor<string, []>("op_114"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_115_cast_fp16 = reshape(shape = var_114, x = linear_0_cast_fp16)[name = tensor<string, []>("op_115_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_0_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(528914880)))]; |
| tensor<fp16, [1024]> encoder_layers_0_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(531012096)))]; |
| tensor<fp16, [1, 256, 1024]> linear_1_cast_fp16 = linear(bias = encoder_layers_0_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_k_proj_weight_to_fp16, x = hidden_states_3_cast_fp16)[name = tensor<string, []>("linear_1_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_0_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(531014208)))]; |
| tensor<fp16, [1024]> encoder_layers_0_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(533111424)))]; |
| tensor<fp16, [1, 256, 1024]> linear_2_cast_fp16 = linear(bias = encoder_layers_0_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_v_proj_weight_to_fp16, x = hidden_states_3_cast_fp16)[name = tensor<string, []>("linear_2_cast_fp16")]; |
| tensor<int32, [4]> var_123 = const()[name = tensor<string, []>("op_123"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_124_cast_fp16 = reshape(shape = var_123, x = linear_1_cast_fp16)[name = tensor<string, []>("op_124_cast_fp16")]; |
| tensor<int32, [4]> var_126 = const()[name = tensor<string, []>("op_126"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_127_cast_fp16 = reshape(shape = var_126, x = linear_2_cast_fp16)[name = tensor<string, []>("op_127_cast_fp16")]; |
| tensor<int32, [4]> value_2_perm_0 = const()[name = tensor<string, []>("value_2_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_130_transpose_x_0 = const()[name = tensor<string, []>("op_130_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_130_transpose_y_0 = const()[name = tensor<string, []>("op_130_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_36_perm_0 = const()[name = tensor<string, []>("transpose_36_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_37_perm_0 = const()[name = tensor<string, []>("transpose_37_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_37 = transpose(perm = transpose_37_perm_0, x = var_124_cast_fp16)[name = tensor<string, []>("transpose_105")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_36 = transpose(perm = transpose_36_perm_0, x = var_115_cast_fp16)[name = tensor<string, []>("transpose_106")]; |
| tensor<fp16, [1, 16, 256, 256]> var_130_cast_fp16 = matmul(transpose_x = var_130_transpose_x_0, transpose_y = var_130_transpose_y_0, x = transpose_36, y = transpose_37)[name = tensor<string, []>("op_130_cast_fp16")]; |
| tensor<fp16, []> var_131_to_fp16 = const()[name = tensor<string, []>("op_131_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_2_cast_fp16 = mul(x = var_130_cast_fp16, y = var_131_to_fp16)[name = tensor<string, []>("attn_weights_2_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_5_cast_fp16 = add(x = attn_weights_2_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_5_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input4_1_cast_fp16 = softmax(axis = var_18, x = input_5_cast_fp16)[name = tensor<string, []>("input4_1_cast_fp16")]; |
| tensor<bool, []> attn_output_2_transpose_x_0 = const()[name = tensor<string, []>("attn_output_2_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_2_transpose_y_0 = const()[name = tensor<string, []>("attn_output_2_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_2_cast_fp16 = transpose(perm = value_2_perm_0, x = var_127_cast_fp16)[name = tensor<string, []>("transpose_107")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_2_cast_fp16 = matmul(transpose_x = attn_output_2_transpose_x_0, transpose_y = attn_output_2_transpose_y_0, x = input4_1_cast_fp16, y = value_2_cast_fp16)[name = tensor<string, []>("attn_output_2_cast_fp16")]; |
| tensor<int32, [4]> var_137_perm_0 = const()[name = tensor<string, []>("op_137_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_139 = const()[name = tensor<string, []>("op_139"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_137_cast_fp16 = transpose(perm = var_137_perm_0, x = attn_output_2_cast_fp16)[name = tensor<string, []>("transpose_104")]; |
| tensor<fp16, [1, 256, 1024]> var_140_cast_fp16 = reshape(shape = var_139, x = var_137_cast_fp16)[name = tensor<string, []>("op_140_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_0_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(533113536)))]; |
| tensor<fp16, [1024]> encoder_layers_0_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(535210752)))]; |
| tensor<fp16, [1, 256, 1024]> linear_3_cast_fp16 = linear(bias = encoder_layers_0_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_out_proj_weight_to_fp16, x = var_140_cast_fp16)[name = tensor<string, []>("linear_3_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input2_1_cast_fp16 = add(x = input0_7_cast_fp16, y = linear_3_cast_fp16)[name = tensor<string, []>("input2_1_cast_fp16")]; |
| tensor<int32, [1]> input0_5_axes_0 = const()[name = tensor<string, []>("input0_5_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_0_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(535212864)))]; |
| tensor<fp16, [1024]> encoder_layers_0_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(535214976)))]; |
| tensor<fp16, [1, 256, 1024]> input0_5_cast_fp16 = layer_norm(axes = input0_5_axes_0, beta = encoder_layers_0_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_0_final_layer_norm_weight_to_fp16, x = input2_1_cast_fp16)[name = tensor<string, []>("input0_5_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_0_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(535217088)))]; |
| tensor<fp16, [4096]> encoder_layers_0_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(543605760)))]; |
| tensor<fp16, [1, 256, 4096]> linear_4_cast_fp16 = linear(bias = encoder_layers_0_fc1_bias_to_fp16, weight = encoder_layers_0_fc1_weight_to_fp16, x = input0_5_cast_fp16)[name = tensor<string, []>("linear_4_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_154_cast_fp16 = relu(x = linear_4_cast_fp16)[name = tensor<string, []>("op_154_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_0_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(543614016)))]; |
| tensor<fp16, [1024]> encoder_layers_0_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_0_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(552002688)))]; |
| tensor<fp16, [1, 256, 1024]> linear_5_cast_fp16 = linear(bias = encoder_layers_0_fc2_bias_to_fp16, weight = encoder_layers_0_fc2_weight_to_fp16, x = var_154_cast_fp16)[name = tensor<string, []>("linear_5_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_160_cast_fp16 = add(x = input2_1_cast_fp16, y = linear_5_cast_fp16)[name = tensor<string, []>("op_160_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_7_axes_0 = const()[name = tensor<string, []>("hidden_states_7_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_1_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(552004800)))]; |
| tensor<fp16, [1024]> encoder_layers_1_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(552006912)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_7_cast_fp16 = layer_norm(axes = hidden_states_7_axes_0, beta = encoder_layers_1_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_1_self_attn_layer_norm_weight_to_fp16, x = var_160_cast_fp16)[name = tensor<string, []>("hidden_states_7_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_1_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(552009024)))]; |
| tensor<fp16, [1024]> encoder_layers_1_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(554106240)))]; |
| tensor<fp16, [1, 256, 1024]> linear_6_cast_fp16 = linear(bias = encoder_layers_1_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_q_proj_weight_to_fp16, x = hidden_states_7_cast_fp16)[name = tensor<string, []>("linear_6_cast_fp16")]; |
| tensor<int32, [4]> var_179 = const()[name = tensor<string, []>("op_179"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_180_cast_fp16 = reshape(shape = var_179, x = linear_6_cast_fp16)[name = tensor<string, []>("op_180_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_1_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(554108352)))]; |
| tensor<fp16, [1024]> encoder_layers_1_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(556205568)))]; |
| tensor<fp16, [1, 256, 1024]> linear_7_cast_fp16 = linear(bias = encoder_layers_1_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_k_proj_weight_to_fp16, x = hidden_states_7_cast_fp16)[name = tensor<string, []>("linear_7_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_1_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(556207680)))]; |
| tensor<fp16, [1024]> encoder_layers_1_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(558304896)))]; |
| tensor<fp16, [1, 256, 1024]> linear_8_cast_fp16 = linear(bias = encoder_layers_1_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_v_proj_weight_to_fp16, x = hidden_states_7_cast_fp16)[name = tensor<string, []>("linear_8_cast_fp16")]; |
| tensor<int32, [4]> var_188 = const()[name = tensor<string, []>("op_188"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_189_cast_fp16 = reshape(shape = var_188, x = linear_7_cast_fp16)[name = tensor<string, []>("op_189_cast_fp16")]; |
| tensor<int32, [4]> var_191 = const()[name = tensor<string, []>("op_191"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_192_cast_fp16 = reshape(shape = var_191, x = linear_8_cast_fp16)[name = tensor<string, []>("op_192_cast_fp16")]; |
| tensor<int32, [4]> value_4_perm_0 = const()[name = tensor<string, []>("value_4_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_195_transpose_x_0 = const()[name = tensor<string, []>("op_195_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_195_transpose_y_0 = const()[name = tensor<string, []>("op_195_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_38_perm_0 = const()[name = tensor<string, []>("transpose_38_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_39_perm_0 = const()[name = tensor<string, []>("transpose_39_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_39 = transpose(perm = transpose_39_perm_0, x = var_189_cast_fp16)[name = tensor<string, []>("transpose_101")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_38 = transpose(perm = transpose_38_perm_0, x = var_180_cast_fp16)[name = tensor<string, []>("transpose_102")]; |
| tensor<fp16, [1, 16, 256, 256]> var_195_cast_fp16 = matmul(transpose_x = var_195_transpose_x_0, transpose_y = var_195_transpose_y_0, x = transpose_38, y = transpose_39)[name = tensor<string, []>("op_195_cast_fp16")]; |
| tensor<fp16, []> var_196_to_fp16 = const()[name = tensor<string, []>("op_196_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_4_cast_fp16 = mul(x = var_195_cast_fp16, y = var_196_to_fp16)[name = tensor<string, []>("attn_weights_4_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_11_cast_fp16 = add(x = attn_weights_4_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_11_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_9_cast_fp16 = softmax(axis = var_18, x = input_11_cast_fp16)[name = tensor<string, []>("input0_9_cast_fp16")]; |
| tensor<bool, []> attn_output_4_transpose_x_0 = const()[name = tensor<string, []>("attn_output_4_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_4_transpose_y_0 = const()[name = tensor<string, []>("attn_output_4_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_4_cast_fp16 = transpose(perm = value_4_perm_0, x = var_192_cast_fp16)[name = tensor<string, []>("transpose_103")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_4_cast_fp16 = matmul(transpose_x = attn_output_4_transpose_x_0, transpose_y = attn_output_4_transpose_y_0, x = input0_9_cast_fp16, y = value_4_cast_fp16)[name = tensor<string, []>("attn_output_4_cast_fp16")]; |
| tensor<int32, [4]> var_202_perm_0 = const()[name = tensor<string, []>("op_202_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_204 = const()[name = tensor<string, []>("op_204"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_202_cast_fp16 = transpose(perm = var_202_perm_0, x = attn_output_4_cast_fp16)[name = tensor<string, []>("transpose_100")]; |
| tensor<fp16, [1, 256, 1024]> var_205_cast_fp16 = reshape(shape = var_204, x = var_202_cast_fp16)[name = tensor<string, []>("op_205_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_1_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(558307008)))]; |
| tensor<fp16, [1024]> encoder_layers_1_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(560404224)))]; |
| tensor<fp16, [1, 256, 1024]> linear_9_cast_fp16 = linear(bias = encoder_layers_1_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_out_proj_weight_to_fp16, x = var_205_cast_fp16)[name = tensor<string, []>("linear_9_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_13_cast_fp16 = add(x = var_160_cast_fp16, y = linear_9_cast_fp16)[name = tensor<string, []>("input_13_cast_fp16")]; |
| tensor<int32, [1]> input0_11_axes_0 = const()[name = tensor<string, []>("input0_11_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_1_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(560406336)))]; |
| tensor<fp16, [1024]> encoder_layers_1_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(560408448)))]; |
| tensor<fp16, [1, 256, 1024]> input0_11_cast_fp16 = layer_norm(axes = input0_11_axes_0, beta = encoder_layers_1_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_1_final_layer_norm_weight_to_fp16, x = input_13_cast_fp16)[name = tensor<string, []>("input0_11_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_1_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(560410560)))]; |
| tensor<fp16, [4096]> encoder_layers_1_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(568799232)))]; |
| tensor<fp16, [1, 256, 4096]> linear_10_cast_fp16 = linear(bias = encoder_layers_1_fc1_bias_to_fp16, weight = encoder_layers_1_fc1_weight_to_fp16, x = input0_11_cast_fp16)[name = tensor<string, []>("linear_10_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_219_cast_fp16 = relu(x = linear_10_cast_fp16)[name = tensor<string, []>("op_219_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_1_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(568807488)))]; |
| tensor<fp16, [1024]> encoder_layers_1_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_1_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(577196160)))]; |
| tensor<fp16, [1, 256, 1024]> linear_11_cast_fp16 = linear(bias = encoder_layers_1_fc2_bias_to_fp16, weight = encoder_layers_1_fc2_weight_to_fp16, x = var_219_cast_fp16)[name = tensor<string, []>("linear_11_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_225_cast_fp16 = add(x = input_13_cast_fp16, y = linear_11_cast_fp16)[name = tensor<string, []>("op_225_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_11_axes_0 = const()[name = tensor<string, []>("hidden_states_11_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_2_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(577198272)))]; |
| tensor<fp16, [1024]> encoder_layers_2_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(577200384)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_11_cast_fp16 = layer_norm(axes = hidden_states_11_axes_0, beta = encoder_layers_2_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_2_self_attn_layer_norm_weight_to_fp16, x = var_225_cast_fp16)[name = tensor<string, []>("hidden_states_11_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_2_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(577202496)))]; |
| tensor<fp16, [1024]> encoder_layers_2_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(579299712)))]; |
| tensor<fp16, [1, 256, 1024]> linear_12_cast_fp16 = linear(bias = encoder_layers_2_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_q_proj_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor<string, []>("linear_12_cast_fp16")]; |
| tensor<int32, [4]> var_244 = const()[name = tensor<string, []>("op_244"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_245_cast_fp16 = reshape(shape = var_244, x = linear_12_cast_fp16)[name = tensor<string, []>("op_245_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_2_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(579301824)))]; |
| tensor<fp16, [1024]> encoder_layers_2_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(581399040)))]; |
| tensor<fp16, [1, 256, 1024]> linear_13_cast_fp16 = linear(bias = encoder_layers_2_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_k_proj_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor<string, []>("linear_13_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_2_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(581401152)))]; |
| tensor<fp16, [1024]> encoder_layers_2_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(583498368)))]; |
| tensor<fp16, [1, 256, 1024]> linear_14_cast_fp16 = linear(bias = encoder_layers_2_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_v_proj_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor<string, []>("linear_14_cast_fp16")]; |
| tensor<int32, [4]> var_253 = const()[name = tensor<string, []>("op_253"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_254_cast_fp16 = reshape(shape = var_253, x = linear_13_cast_fp16)[name = tensor<string, []>("op_254_cast_fp16")]; |
| tensor<int32, [4]> var_256 = const()[name = tensor<string, []>("op_256"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_257_cast_fp16 = reshape(shape = var_256, x = linear_14_cast_fp16)[name = tensor<string, []>("op_257_cast_fp16")]; |
| tensor<int32, [4]> value_6_perm_0 = const()[name = tensor<string, []>("value_6_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_260_transpose_x_0 = const()[name = tensor<string, []>("op_260_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_260_transpose_y_0 = const()[name = tensor<string, []>("op_260_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_40_perm_0 = const()[name = tensor<string, []>("transpose_40_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_41_perm_0 = const()[name = tensor<string, []>("transpose_41_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_41 = transpose(perm = transpose_41_perm_0, x = var_254_cast_fp16)[name = tensor<string, []>("transpose_97")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_40 = transpose(perm = transpose_40_perm_0, x = var_245_cast_fp16)[name = tensor<string, []>("transpose_98")]; |
| tensor<fp16, [1, 16, 256, 256]> var_260_cast_fp16 = matmul(transpose_x = var_260_transpose_x_0, transpose_y = var_260_transpose_y_0, x = transpose_40, y = transpose_41)[name = tensor<string, []>("op_260_cast_fp16")]; |
| tensor<fp16, []> var_261_to_fp16 = const()[name = tensor<string, []>("op_261_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_6_cast_fp16 = mul(x = var_260_cast_fp16, y = var_261_to_fp16)[name = tensor<string, []>("attn_weights_6_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_17_cast_fp16 = add(x = attn_weights_6_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_17_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_15_cast_fp16 = softmax(axis = var_18, x = input_17_cast_fp16)[name = tensor<string, []>("input0_15_cast_fp16")]; |
| tensor<bool, []> attn_output_6_transpose_x_0 = const()[name = tensor<string, []>("attn_output_6_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_6_transpose_y_0 = const()[name = tensor<string, []>("attn_output_6_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_6_cast_fp16 = transpose(perm = value_6_perm_0, x = var_257_cast_fp16)[name = tensor<string, []>("transpose_99")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_6_cast_fp16 = matmul(transpose_x = attn_output_6_transpose_x_0, transpose_y = attn_output_6_transpose_y_0, x = input0_15_cast_fp16, y = value_6_cast_fp16)[name = tensor<string, []>("attn_output_6_cast_fp16")]; |
| tensor<int32, [4]> var_267_perm_0 = const()[name = tensor<string, []>("op_267_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_269 = const()[name = tensor<string, []>("op_269"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_267_cast_fp16 = transpose(perm = var_267_perm_0, x = attn_output_6_cast_fp16)[name = tensor<string, []>("transpose_96")]; |
| tensor<fp16, [1, 256, 1024]> var_270_cast_fp16 = reshape(shape = var_269, x = var_267_cast_fp16)[name = tensor<string, []>("op_270_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_2_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(583500480)))]; |
| tensor<fp16, [1024]> encoder_layers_2_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(585597696)))]; |
| tensor<fp16, [1, 256, 1024]> linear_15_cast_fp16 = linear(bias = encoder_layers_2_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_out_proj_weight_to_fp16, x = var_270_cast_fp16)[name = tensor<string, []>("linear_15_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_19_cast_fp16 = add(x = var_225_cast_fp16, y = linear_15_cast_fp16)[name = tensor<string, []>("input_19_cast_fp16")]; |
| tensor<int32, [1]> input0_17_axes_0 = const()[name = tensor<string, []>("input0_17_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_2_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(585599808)))]; |
| tensor<fp16, [1024]> encoder_layers_2_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(585601920)))]; |
| tensor<fp16, [1, 256, 1024]> input0_17_cast_fp16 = layer_norm(axes = input0_17_axes_0, beta = encoder_layers_2_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_2_final_layer_norm_weight_to_fp16, x = input_19_cast_fp16)[name = tensor<string, []>("input0_17_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_2_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(585604032)))]; |
| tensor<fp16, [4096]> encoder_layers_2_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(593992704)))]; |
| tensor<fp16, [1, 256, 4096]> linear_16_cast_fp16 = linear(bias = encoder_layers_2_fc1_bias_to_fp16, weight = encoder_layers_2_fc1_weight_to_fp16, x = input0_17_cast_fp16)[name = tensor<string, []>("linear_16_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_284_cast_fp16 = relu(x = linear_16_cast_fp16)[name = tensor<string, []>("op_284_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_2_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(594000960)))]; |
| tensor<fp16, [1024]> encoder_layers_2_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_2_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(602389632)))]; |
| tensor<fp16, [1, 256, 1024]> linear_17_cast_fp16 = linear(bias = encoder_layers_2_fc2_bias_to_fp16, weight = encoder_layers_2_fc2_weight_to_fp16, x = var_284_cast_fp16)[name = tensor<string, []>("linear_17_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_290_cast_fp16 = add(x = input_19_cast_fp16, y = linear_17_cast_fp16)[name = tensor<string, []>("op_290_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_15_axes_0 = const()[name = tensor<string, []>("hidden_states_15_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_3_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(602391744)))]; |
| tensor<fp16, [1024]> encoder_layers_3_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(602393856)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_15_cast_fp16 = layer_norm(axes = hidden_states_15_axes_0, beta = encoder_layers_3_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_3_self_attn_layer_norm_weight_to_fp16, x = var_290_cast_fp16)[name = tensor<string, []>("hidden_states_15_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_3_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(602395968)))]; |
| tensor<fp16, [1024]> encoder_layers_3_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(604493184)))]; |
| tensor<fp16, [1, 256, 1024]> linear_18_cast_fp16 = linear(bias = encoder_layers_3_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_q_proj_weight_to_fp16, x = hidden_states_15_cast_fp16)[name = tensor<string, []>("linear_18_cast_fp16")]; |
| tensor<int32, [4]> var_309 = const()[name = tensor<string, []>("op_309"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_310_cast_fp16 = reshape(shape = var_309, x = linear_18_cast_fp16)[name = tensor<string, []>("op_310_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_3_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(604495296)))]; |
| tensor<fp16, [1024]> encoder_layers_3_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(606592512)))]; |
| tensor<fp16, [1, 256, 1024]> linear_19_cast_fp16 = linear(bias = encoder_layers_3_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_k_proj_weight_to_fp16, x = hidden_states_15_cast_fp16)[name = tensor<string, []>("linear_19_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_3_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(606594624)))]; |
| tensor<fp16, [1024]> encoder_layers_3_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(608691840)))]; |
| tensor<fp16, [1, 256, 1024]> linear_20_cast_fp16 = linear(bias = encoder_layers_3_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_v_proj_weight_to_fp16, x = hidden_states_15_cast_fp16)[name = tensor<string, []>("linear_20_cast_fp16")]; |
| tensor<int32, [4]> var_318 = const()[name = tensor<string, []>("op_318"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_319_cast_fp16 = reshape(shape = var_318, x = linear_19_cast_fp16)[name = tensor<string, []>("op_319_cast_fp16")]; |
| tensor<int32, [4]> var_321 = const()[name = tensor<string, []>("op_321"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_322_cast_fp16 = reshape(shape = var_321, x = linear_20_cast_fp16)[name = tensor<string, []>("op_322_cast_fp16")]; |
| tensor<int32, [4]> value_8_perm_0 = const()[name = tensor<string, []>("value_8_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_325_transpose_x_0 = const()[name = tensor<string, []>("op_325_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_325_transpose_y_0 = const()[name = tensor<string, []>("op_325_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_42_perm_0 = const()[name = tensor<string, []>("transpose_42_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_43_perm_0 = const()[name = tensor<string, []>("transpose_43_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_43 = transpose(perm = transpose_43_perm_0, x = var_319_cast_fp16)[name = tensor<string, []>("transpose_93")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_42 = transpose(perm = transpose_42_perm_0, x = var_310_cast_fp16)[name = tensor<string, []>("transpose_94")]; |
| tensor<fp16, [1, 16, 256, 256]> var_325_cast_fp16 = matmul(transpose_x = var_325_transpose_x_0, transpose_y = var_325_transpose_y_0, x = transpose_42, y = transpose_43)[name = tensor<string, []>("op_325_cast_fp16")]; |
| tensor<fp16, []> var_326_to_fp16 = const()[name = tensor<string, []>("op_326_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_8_cast_fp16 = mul(x = var_325_cast_fp16, y = var_326_to_fp16)[name = tensor<string, []>("attn_weights_8_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_23_cast_fp16 = add(x = attn_weights_8_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_23_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_21_cast_fp16 = softmax(axis = var_18, x = input_23_cast_fp16)[name = tensor<string, []>("input0_21_cast_fp16")]; |
| tensor<bool, []> attn_output_8_transpose_x_0 = const()[name = tensor<string, []>("attn_output_8_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_8_transpose_y_0 = const()[name = tensor<string, []>("attn_output_8_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_8_cast_fp16 = transpose(perm = value_8_perm_0, x = var_322_cast_fp16)[name = tensor<string, []>("transpose_95")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_8_cast_fp16 = matmul(transpose_x = attn_output_8_transpose_x_0, transpose_y = attn_output_8_transpose_y_0, x = input0_21_cast_fp16, y = value_8_cast_fp16)[name = tensor<string, []>("attn_output_8_cast_fp16")]; |
| tensor<int32, [4]> var_332_perm_0 = const()[name = tensor<string, []>("op_332_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_334 = const()[name = tensor<string, []>("op_334"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_332_cast_fp16 = transpose(perm = var_332_perm_0, x = attn_output_8_cast_fp16)[name = tensor<string, []>("transpose_92")]; |
| tensor<fp16, [1, 256, 1024]> var_335_cast_fp16 = reshape(shape = var_334, x = var_332_cast_fp16)[name = tensor<string, []>("op_335_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_3_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(608693952)))]; |
| tensor<fp16, [1024]> encoder_layers_3_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(610791168)))]; |
| tensor<fp16, [1, 256, 1024]> linear_21_cast_fp16 = linear(bias = encoder_layers_3_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_out_proj_weight_to_fp16, x = var_335_cast_fp16)[name = tensor<string, []>("linear_21_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_25_cast_fp16 = add(x = var_290_cast_fp16, y = linear_21_cast_fp16)[name = tensor<string, []>("input_25_cast_fp16")]; |
| tensor<int32, [1]> input0_23_axes_0 = const()[name = tensor<string, []>("input0_23_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_3_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(610793280)))]; |
| tensor<fp16, [1024]> encoder_layers_3_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(610795392)))]; |
| tensor<fp16, [1, 256, 1024]> input0_23_cast_fp16 = layer_norm(axes = input0_23_axes_0, beta = encoder_layers_3_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_3_final_layer_norm_weight_to_fp16, x = input_25_cast_fp16)[name = tensor<string, []>("input0_23_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_3_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(610797504)))]; |
| tensor<fp16, [4096]> encoder_layers_3_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(619186176)))]; |
| tensor<fp16, [1, 256, 4096]> linear_22_cast_fp16 = linear(bias = encoder_layers_3_fc1_bias_to_fp16, weight = encoder_layers_3_fc1_weight_to_fp16, x = input0_23_cast_fp16)[name = tensor<string, []>("linear_22_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_349_cast_fp16 = relu(x = linear_22_cast_fp16)[name = tensor<string, []>("op_349_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_3_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(619194432)))]; |
| tensor<fp16, [1024]> encoder_layers_3_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_3_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(627583104)))]; |
| tensor<fp16, [1, 256, 1024]> linear_23_cast_fp16 = linear(bias = encoder_layers_3_fc2_bias_to_fp16, weight = encoder_layers_3_fc2_weight_to_fp16, x = var_349_cast_fp16)[name = tensor<string, []>("linear_23_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_355_cast_fp16 = add(x = input_25_cast_fp16, y = linear_23_cast_fp16)[name = tensor<string, []>("op_355_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_19_axes_0 = const()[name = tensor<string, []>("hidden_states_19_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_4_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(627585216)))]; |
| tensor<fp16, [1024]> encoder_layers_4_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(627587328)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_19_cast_fp16 = layer_norm(axes = hidden_states_19_axes_0, beta = encoder_layers_4_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_4_self_attn_layer_norm_weight_to_fp16, x = var_355_cast_fp16)[name = tensor<string, []>("hidden_states_19_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_4_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(627589440)))]; |
| tensor<fp16, [1024]> encoder_layers_4_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(629686656)))]; |
| tensor<fp16, [1, 256, 1024]> linear_24_cast_fp16 = linear(bias = encoder_layers_4_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_q_proj_weight_to_fp16, x = hidden_states_19_cast_fp16)[name = tensor<string, []>("linear_24_cast_fp16")]; |
| tensor<int32, [4]> var_374 = const()[name = tensor<string, []>("op_374"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_375_cast_fp16 = reshape(shape = var_374, x = linear_24_cast_fp16)[name = tensor<string, []>("op_375_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_4_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(629688768)))]; |
| tensor<fp16, [1024]> encoder_layers_4_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(631785984)))]; |
| tensor<fp16, [1, 256, 1024]> linear_25_cast_fp16 = linear(bias = encoder_layers_4_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_k_proj_weight_to_fp16, x = hidden_states_19_cast_fp16)[name = tensor<string, []>("linear_25_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_4_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(631788096)))]; |
| tensor<fp16, [1024]> encoder_layers_4_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(633885312)))]; |
| tensor<fp16, [1, 256, 1024]> linear_26_cast_fp16 = linear(bias = encoder_layers_4_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_v_proj_weight_to_fp16, x = hidden_states_19_cast_fp16)[name = tensor<string, []>("linear_26_cast_fp16")]; |
| tensor<int32, [4]> var_383 = const()[name = tensor<string, []>("op_383"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_384_cast_fp16 = reshape(shape = var_383, x = linear_25_cast_fp16)[name = tensor<string, []>("op_384_cast_fp16")]; |
| tensor<int32, [4]> var_386 = const()[name = tensor<string, []>("op_386"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_387_cast_fp16 = reshape(shape = var_386, x = linear_26_cast_fp16)[name = tensor<string, []>("op_387_cast_fp16")]; |
| tensor<int32, [4]> value_10_perm_0 = const()[name = tensor<string, []>("value_10_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_390_transpose_x_0 = const()[name = tensor<string, []>("op_390_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_390_transpose_y_0 = const()[name = tensor<string, []>("op_390_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_44_perm_0 = const()[name = tensor<string, []>("transpose_44_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_45_perm_0 = const()[name = tensor<string, []>("transpose_45_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_45 = transpose(perm = transpose_45_perm_0, x = var_384_cast_fp16)[name = tensor<string, []>("transpose_89")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_44 = transpose(perm = transpose_44_perm_0, x = var_375_cast_fp16)[name = tensor<string, []>("transpose_90")]; |
| tensor<fp16, [1, 16, 256, 256]> var_390_cast_fp16 = matmul(transpose_x = var_390_transpose_x_0, transpose_y = var_390_transpose_y_0, x = transpose_44, y = transpose_45)[name = tensor<string, []>("op_390_cast_fp16")]; |
| tensor<fp16, []> var_391_to_fp16 = const()[name = tensor<string, []>("op_391_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_10_cast_fp16 = mul(x = var_390_cast_fp16, y = var_391_to_fp16)[name = tensor<string, []>("attn_weights_10_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_29_cast_fp16 = add(x = attn_weights_10_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_29_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_27_cast_fp16 = softmax(axis = var_18, x = input_29_cast_fp16)[name = tensor<string, []>("input0_27_cast_fp16")]; |
| tensor<bool, []> attn_output_10_transpose_x_0 = const()[name = tensor<string, []>("attn_output_10_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_10_transpose_y_0 = const()[name = tensor<string, []>("attn_output_10_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_10_cast_fp16 = transpose(perm = value_10_perm_0, x = var_387_cast_fp16)[name = tensor<string, []>("transpose_91")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_10_cast_fp16 = matmul(transpose_x = attn_output_10_transpose_x_0, transpose_y = attn_output_10_transpose_y_0, x = input0_27_cast_fp16, y = value_10_cast_fp16)[name = tensor<string, []>("attn_output_10_cast_fp16")]; |
| tensor<int32, [4]> var_397_perm_0 = const()[name = tensor<string, []>("op_397_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_399 = const()[name = tensor<string, []>("op_399"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_397_cast_fp16 = transpose(perm = var_397_perm_0, x = attn_output_10_cast_fp16)[name = tensor<string, []>("transpose_88")]; |
| tensor<fp16, [1, 256, 1024]> var_400_cast_fp16 = reshape(shape = var_399, x = var_397_cast_fp16)[name = tensor<string, []>("op_400_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_4_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(633887424)))]; |
| tensor<fp16, [1024]> encoder_layers_4_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(635984640)))]; |
| tensor<fp16, [1, 256, 1024]> linear_27_cast_fp16 = linear(bias = encoder_layers_4_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_out_proj_weight_to_fp16, x = var_400_cast_fp16)[name = tensor<string, []>("linear_27_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_31_cast_fp16 = add(x = var_355_cast_fp16, y = linear_27_cast_fp16)[name = tensor<string, []>("input_31_cast_fp16")]; |
| tensor<int32, [1]> input0_29_axes_0 = const()[name = tensor<string, []>("input0_29_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_4_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(635986752)))]; |
| tensor<fp16, [1024]> encoder_layers_4_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(635988864)))]; |
| tensor<fp16, [1, 256, 1024]> input0_29_cast_fp16 = layer_norm(axes = input0_29_axes_0, beta = encoder_layers_4_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_4_final_layer_norm_weight_to_fp16, x = input_31_cast_fp16)[name = tensor<string, []>("input0_29_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_4_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(635990976)))]; |
| tensor<fp16, [4096]> encoder_layers_4_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(644379648)))]; |
| tensor<fp16, [1, 256, 4096]> linear_28_cast_fp16 = linear(bias = encoder_layers_4_fc1_bias_to_fp16, weight = encoder_layers_4_fc1_weight_to_fp16, x = input0_29_cast_fp16)[name = tensor<string, []>("linear_28_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_414_cast_fp16 = relu(x = linear_28_cast_fp16)[name = tensor<string, []>("op_414_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_4_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(644387904)))]; |
| tensor<fp16, [1024]> encoder_layers_4_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_4_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(652776576)))]; |
| tensor<fp16, [1, 256, 1024]> linear_29_cast_fp16 = linear(bias = encoder_layers_4_fc2_bias_to_fp16, weight = encoder_layers_4_fc2_weight_to_fp16, x = var_414_cast_fp16)[name = tensor<string, []>("linear_29_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_420_cast_fp16 = add(x = input_31_cast_fp16, y = linear_29_cast_fp16)[name = tensor<string, []>("op_420_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_23_axes_0 = const()[name = tensor<string, []>("hidden_states_23_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_5_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(652778688)))]; |
| tensor<fp16, [1024]> encoder_layers_5_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(652780800)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_23_cast_fp16 = layer_norm(axes = hidden_states_23_axes_0, beta = encoder_layers_5_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_5_self_attn_layer_norm_weight_to_fp16, x = var_420_cast_fp16)[name = tensor<string, []>("hidden_states_23_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_5_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(652782912)))]; |
| tensor<fp16, [1024]> encoder_layers_5_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(654880128)))]; |
| tensor<fp16, [1, 256, 1024]> linear_30_cast_fp16 = linear(bias = encoder_layers_5_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_q_proj_weight_to_fp16, x = hidden_states_23_cast_fp16)[name = tensor<string, []>("linear_30_cast_fp16")]; |
| tensor<int32, [4]> var_439 = const()[name = tensor<string, []>("op_439"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_440_cast_fp16 = reshape(shape = var_439, x = linear_30_cast_fp16)[name = tensor<string, []>("op_440_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_5_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(654882240)))]; |
| tensor<fp16, [1024]> encoder_layers_5_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(656979456)))]; |
| tensor<fp16, [1, 256, 1024]> linear_31_cast_fp16 = linear(bias = encoder_layers_5_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_k_proj_weight_to_fp16, x = hidden_states_23_cast_fp16)[name = tensor<string, []>("linear_31_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_5_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(656981568)))]; |
| tensor<fp16, [1024]> encoder_layers_5_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(659078784)))]; |
| tensor<fp16, [1, 256, 1024]> linear_32_cast_fp16 = linear(bias = encoder_layers_5_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_v_proj_weight_to_fp16, x = hidden_states_23_cast_fp16)[name = tensor<string, []>("linear_32_cast_fp16")]; |
| tensor<int32, [4]> var_448 = const()[name = tensor<string, []>("op_448"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_449_cast_fp16 = reshape(shape = var_448, x = linear_31_cast_fp16)[name = tensor<string, []>("op_449_cast_fp16")]; |
| tensor<int32, [4]> var_451 = const()[name = tensor<string, []>("op_451"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_452_cast_fp16 = reshape(shape = var_451, x = linear_32_cast_fp16)[name = tensor<string, []>("op_452_cast_fp16")]; |
| tensor<int32, [4]> value_12_perm_0 = const()[name = tensor<string, []>("value_12_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_455_transpose_x_0 = const()[name = tensor<string, []>("op_455_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_455_transpose_y_0 = const()[name = tensor<string, []>("op_455_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_46_perm_0 = const()[name = tensor<string, []>("transpose_46_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_47_perm_0 = const()[name = tensor<string, []>("transpose_47_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_47 = transpose(perm = transpose_47_perm_0, x = var_449_cast_fp16)[name = tensor<string, []>("transpose_85")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_46 = transpose(perm = transpose_46_perm_0, x = var_440_cast_fp16)[name = tensor<string, []>("transpose_86")]; |
| tensor<fp16, [1, 16, 256, 256]> var_455_cast_fp16 = matmul(transpose_x = var_455_transpose_x_0, transpose_y = var_455_transpose_y_0, x = transpose_46, y = transpose_47)[name = tensor<string, []>("op_455_cast_fp16")]; |
| tensor<fp16, []> var_456_to_fp16 = const()[name = tensor<string, []>("op_456_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_12_cast_fp16 = mul(x = var_455_cast_fp16, y = var_456_to_fp16)[name = tensor<string, []>("attn_weights_12_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_35_cast_fp16 = add(x = attn_weights_12_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_35_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_33_cast_fp16 = softmax(axis = var_18, x = input_35_cast_fp16)[name = tensor<string, []>("input0_33_cast_fp16")]; |
| tensor<bool, []> attn_output_12_transpose_x_0 = const()[name = tensor<string, []>("attn_output_12_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_12_transpose_y_0 = const()[name = tensor<string, []>("attn_output_12_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_12_cast_fp16 = transpose(perm = value_12_perm_0, x = var_452_cast_fp16)[name = tensor<string, []>("transpose_87")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_12_cast_fp16 = matmul(transpose_x = attn_output_12_transpose_x_0, transpose_y = attn_output_12_transpose_y_0, x = input0_33_cast_fp16, y = value_12_cast_fp16)[name = tensor<string, []>("attn_output_12_cast_fp16")]; |
| tensor<int32, [4]> var_462_perm_0 = const()[name = tensor<string, []>("op_462_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_464 = const()[name = tensor<string, []>("op_464"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_462_cast_fp16 = transpose(perm = var_462_perm_0, x = attn_output_12_cast_fp16)[name = tensor<string, []>("transpose_84")]; |
| tensor<fp16, [1, 256, 1024]> var_465_cast_fp16 = reshape(shape = var_464, x = var_462_cast_fp16)[name = tensor<string, []>("op_465_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_5_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(659080896)))]; |
| tensor<fp16, [1024]> encoder_layers_5_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(661178112)))]; |
| tensor<fp16, [1, 256, 1024]> linear_33_cast_fp16 = linear(bias = encoder_layers_5_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_out_proj_weight_to_fp16, x = var_465_cast_fp16)[name = tensor<string, []>("linear_33_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_37_cast_fp16 = add(x = var_420_cast_fp16, y = linear_33_cast_fp16)[name = tensor<string, []>("input_37_cast_fp16")]; |
| tensor<int32, [1]> input0_35_axes_0 = const()[name = tensor<string, []>("input0_35_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_5_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(661180224)))]; |
| tensor<fp16, [1024]> encoder_layers_5_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(661182336)))]; |
| tensor<fp16, [1, 256, 1024]> input0_35_cast_fp16 = layer_norm(axes = input0_35_axes_0, beta = encoder_layers_5_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_5_final_layer_norm_weight_to_fp16, x = input_37_cast_fp16)[name = tensor<string, []>("input0_35_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_5_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(661184448)))]; |
| tensor<fp16, [4096]> encoder_layers_5_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(669573120)))]; |
| tensor<fp16, [1, 256, 4096]> linear_34_cast_fp16 = linear(bias = encoder_layers_5_fc1_bias_to_fp16, weight = encoder_layers_5_fc1_weight_to_fp16, x = input0_35_cast_fp16)[name = tensor<string, []>("linear_34_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_479_cast_fp16 = relu(x = linear_34_cast_fp16)[name = tensor<string, []>("op_479_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_5_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(669581376)))]; |
| tensor<fp16, [1024]> encoder_layers_5_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_5_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(677970048)))]; |
| tensor<fp16, [1, 256, 1024]> linear_35_cast_fp16 = linear(bias = encoder_layers_5_fc2_bias_to_fp16, weight = encoder_layers_5_fc2_weight_to_fp16, x = var_479_cast_fp16)[name = tensor<string, []>("linear_35_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_485_cast_fp16 = add(x = input_37_cast_fp16, y = linear_35_cast_fp16)[name = tensor<string, []>("op_485_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_27_axes_0 = const()[name = tensor<string, []>("hidden_states_27_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_6_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(677972160)))]; |
| tensor<fp16, [1024]> encoder_layers_6_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(677974272)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_27_cast_fp16 = layer_norm(axes = hidden_states_27_axes_0, beta = encoder_layers_6_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_6_self_attn_layer_norm_weight_to_fp16, x = var_485_cast_fp16)[name = tensor<string, []>("hidden_states_27_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_6_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(677976384)))]; |
| tensor<fp16, [1024]> encoder_layers_6_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(680073600)))]; |
| tensor<fp16, [1, 256, 1024]> linear_36_cast_fp16 = linear(bias = encoder_layers_6_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_q_proj_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor<string, []>("linear_36_cast_fp16")]; |
| tensor<int32, [4]> var_504 = const()[name = tensor<string, []>("op_504"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_505_cast_fp16 = reshape(shape = var_504, x = linear_36_cast_fp16)[name = tensor<string, []>("op_505_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_6_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(680075712)))]; |
| tensor<fp16, [1024]> encoder_layers_6_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(682172928)))]; |
| tensor<fp16, [1, 256, 1024]> linear_37_cast_fp16 = linear(bias = encoder_layers_6_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_k_proj_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor<string, []>("linear_37_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_6_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(682175040)))]; |
| tensor<fp16, [1024]> encoder_layers_6_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(684272256)))]; |
| tensor<fp16, [1, 256, 1024]> linear_38_cast_fp16 = linear(bias = encoder_layers_6_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_v_proj_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor<string, []>("linear_38_cast_fp16")]; |
| tensor<int32, [4]> var_513 = const()[name = tensor<string, []>("op_513"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_514_cast_fp16 = reshape(shape = var_513, x = linear_37_cast_fp16)[name = tensor<string, []>("op_514_cast_fp16")]; |
| tensor<int32, [4]> var_516 = const()[name = tensor<string, []>("op_516"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_517_cast_fp16 = reshape(shape = var_516, x = linear_38_cast_fp16)[name = tensor<string, []>("op_517_cast_fp16")]; |
| tensor<int32, [4]> value_14_perm_0 = const()[name = tensor<string, []>("value_14_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_520_transpose_x_0 = const()[name = tensor<string, []>("op_520_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_520_transpose_y_0 = const()[name = tensor<string, []>("op_520_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_48_perm_0 = const()[name = tensor<string, []>("transpose_48_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_49_perm_0 = const()[name = tensor<string, []>("transpose_49_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_49 = transpose(perm = transpose_49_perm_0, x = var_514_cast_fp16)[name = tensor<string, []>("transpose_81")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_48 = transpose(perm = transpose_48_perm_0, x = var_505_cast_fp16)[name = tensor<string, []>("transpose_82")]; |
| tensor<fp16, [1, 16, 256, 256]> var_520_cast_fp16 = matmul(transpose_x = var_520_transpose_x_0, transpose_y = var_520_transpose_y_0, x = transpose_48, y = transpose_49)[name = tensor<string, []>("op_520_cast_fp16")]; |
| tensor<fp16, []> var_521_to_fp16 = const()[name = tensor<string, []>("op_521_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_14_cast_fp16 = mul(x = var_520_cast_fp16, y = var_521_to_fp16)[name = tensor<string, []>("attn_weights_14_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_41_cast_fp16 = add(x = attn_weights_14_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_41_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_39_cast_fp16 = softmax(axis = var_18, x = input_41_cast_fp16)[name = tensor<string, []>("input0_39_cast_fp16")]; |
| tensor<bool, []> attn_output_14_transpose_x_0 = const()[name = tensor<string, []>("attn_output_14_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_14_transpose_y_0 = const()[name = tensor<string, []>("attn_output_14_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_14_cast_fp16 = transpose(perm = value_14_perm_0, x = var_517_cast_fp16)[name = tensor<string, []>("transpose_83")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_14_cast_fp16 = matmul(transpose_x = attn_output_14_transpose_x_0, transpose_y = attn_output_14_transpose_y_0, x = input0_39_cast_fp16, y = value_14_cast_fp16)[name = tensor<string, []>("attn_output_14_cast_fp16")]; |
| tensor<int32, [4]> var_527_perm_0 = const()[name = tensor<string, []>("op_527_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_529 = const()[name = tensor<string, []>("op_529"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_527_cast_fp16 = transpose(perm = var_527_perm_0, x = attn_output_14_cast_fp16)[name = tensor<string, []>("transpose_80")]; |
| tensor<fp16, [1, 256, 1024]> var_530_cast_fp16 = reshape(shape = var_529, x = var_527_cast_fp16)[name = tensor<string, []>("op_530_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_6_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(684274368)))]; |
| tensor<fp16, [1024]> encoder_layers_6_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(686371584)))]; |
| tensor<fp16, [1, 256, 1024]> linear_39_cast_fp16 = linear(bias = encoder_layers_6_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_out_proj_weight_to_fp16, x = var_530_cast_fp16)[name = tensor<string, []>("linear_39_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_43_cast_fp16 = add(x = var_485_cast_fp16, y = linear_39_cast_fp16)[name = tensor<string, []>("input_43_cast_fp16")]; |
| tensor<int32, [1]> input0_41_axes_0 = const()[name = tensor<string, []>("input0_41_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_6_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(686373696)))]; |
| tensor<fp16, [1024]> encoder_layers_6_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(686375808)))]; |
| tensor<fp16, [1, 256, 1024]> input0_41_cast_fp16 = layer_norm(axes = input0_41_axes_0, beta = encoder_layers_6_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_6_final_layer_norm_weight_to_fp16, x = input_43_cast_fp16)[name = tensor<string, []>("input0_41_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_6_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(686377920)))]; |
| tensor<fp16, [4096]> encoder_layers_6_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(694766592)))]; |
| tensor<fp16, [1, 256, 4096]> linear_40_cast_fp16 = linear(bias = encoder_layers_6_fc1_bias_to_fp16, weight = encoder_layers_6_fc1_weight_to_fp16, x = input0_41_cast_fp16)[name = tensor<string, []>("linear_40_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_544_cast_fp16 = relu(x = linear_40_cast_fp16)[name = tensor<string, []>("op_544_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_6_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(694774848)))]; |
| tensor<fp16, [1024]> encoder_layers_6_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_6_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(703163520)))]; |
| tensor<fp16, [1, 256, 1024]> linear_41_cast_fp16 = linear(bias = encoder_layers_6_fc2_bias_to_fp16, weight = encoder_layers_6_fc2_weight_to_fp16, x = var_544_cast_fp16)[name = tensor<string, []>("linear_41_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_550_cast_fp16 = add(x = input_43_cast_fp16, y = linear_41_cast_fp16)[name = tensor<string, []>("op_550_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_31_axes_0 = const()[name = tensor<string, []>("hidden_states_31_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_7_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(703165632)))]; |
| tensor<fp16, [1024]> encoder_layers_7_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(703167744)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_31_cast_fp16 = layer_norm(axes = hidden_states_31_axes_0, beta = encoder_layers_7_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_7_self_attn_layer_norm_weight_to_fp16, x = var_550_cast_fp16)[name = tensor<string, []>("hidden_states_31_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_7_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(703169856)))]; |
| tensor<fp16, [1024]> encoder_layers_7_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(705267072)))]; |
| tensor<fp16, [1, 256, 1024]> linear_42_cast_fp16 = linear(bias = encoder_layers_7_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_q_proj_weight_to_fp16, x = hidden_states_31_cast_fp16)[name = tensor<string, []>("linear_42_cast_fp16")]; |
| tensor<int32, [4]> var_569 = const()[name = tensor<string, []>("op_569"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_570_cast_fp16 = reshape(shape = var_569, x = linear_42_cast_fp16)[name = tensor<string, []>("op_570_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_7_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(705269184)))]; |
| tensor<fp16, [1024]> encoder_layers_7_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(707366400)))]; |
| tensor<fp16, [1, 256, 1024]> linear_43_cast_fp16 = linear(bias = encoder_layers_7_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_k_proj_weight_to_fp16, x = hidden_states_31_cast_fp16)[name = tensor<string, []>("linear_43_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_7_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(707368512)))]; |
| tensor<fp16, [1024]> encoder_layers_7_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(709465728)))]; |
| tensor<fp16, [1, 256, 1024]> linear_44_cast_fp16 = linear(bias = encoder_layers_7_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_v_proj_weight_to_fp16, x = hidden_states_31_cast_fp16)[name = tensor<string, []>("linear_44_cast_fp16")]; |
| tensor<int32, [4]> var_578 = const()[name = tensor<string, []>("op_578"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_579_cast_fp16 = reshape(shape = var_578, x = linear_43_cast_fp16)[name = tensor<string, []>("op_579_cast_fp16")]; |
| tensor<int32, [4]> var_581 = const()[name = tensor<string, []>("op_581"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_582_cast_fp16 = reshape(shape = var_581, x = linear_44_cast_fp16)[name = tensor<string, []>("op_582_cast_fp16")]; |
| tensor<int32, [4]> value_16_perm_0 = const()[name = tensor<string, []>("value_16_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_585_transpose_x_0 = const()[name = tensor<string, []>("op_585_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_585_transpose_y_0 = const()[name = tensor<string, []>("op_585_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_50_perm_0 = const()[name = tensor<string, []>("transpose_50_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_51_perm_0 = const()[name = tensor<string, []>("transpose_51_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_51 = transpose(perm = transpose_51_perm_0, x = var_579_cast_fp16)[name = tensor<string, []>("transpose_77")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_50 = transpose(perm = transpose_50_perm_0, x = var_570_cast_fp16)[name = tensor<string, []>("transpose_78")]; |
| tensor<fp16, [1, 16, 256, 256]> var_585_cast_fp16 = matmul(transpose_x = var_585_transpose_x_0, transpose_y = var_585_transpose_y_0, x = transpose_50, y = transpose_51)[name = tensor<string, []>("op_585_cast_fp16")]; |
| tensor<fp16, []> var_586_to_fp16 = const()[name = tensor<string, []>("op_586_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_16_cast_fp16 = mul(x = var_585_cast_fp16, y = var_586_to_fp16)[name = tensor<string, []>("attn_weights_16_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_47_cast_fp16 = add(x = attn_weights_16_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_47_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_45_cast_fp16 = softmax(axis = var_18, x = input_47_cast_fp16)[name = tensor<string, []>("input0_45_cast_fp16")]; |
| tensor<bool, []> attn_output_16_transpose_x_0 = const()[name = tensor<string, []>("attn_output_16_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_16_transpose_y_0 = const()[name = tensor<string, []>("attn_output_16_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_16_cast_fp16 = transpose(perm = value_16_perm_0, x = var_582_cast_fp16)[name = tensor<string, []>("transpose_79")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_16_cast_fp16 = matmul(transpose_x = attn_output_16_transpose_x_0, transpose_y = attn_output_16_transpose_y_0, x = input0_45_cast_fp16, y = value_16_cast_fp16)[name = tensor<string, []>("attn_output_16_cast_fp16")]; |
| tensor<int32, [4]> var_592_perm_0 = const()[name = tensor<string, []>("op_592_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_594 = const()[name = tensor<string, []>("op_594"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_592_cast_fp16 = transpose(perm = var_592_perm_0, x = attn_output_16_cast_fp16)[name = tensor<string, []>("transpose_76")]; |
| tensor<fp16, [1, 256, 1024]> var_595_cast_fp16 = reshape(shape = var_594, x = var_592_cast_fp16)[name = tensor<string, []>("op_595_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_7_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(709467840)))]; |
| tensor<fp16, [1024]> encoder_layers_7_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(711565056)))]; |
| tensor<fp16, [1, 256, 1024]> linear_45_cast_fp16 = linear(bias = encoder_layers_7_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_out_proj_weight_to_fp16, x = var_595_cast_fp16)[name = tensor<string, []>("linear_45_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_49_cast_fp16 = add(x = var_550_cast_fp16, y = linear_45_cast_fp16)[name = tensor<string, []>("input_49_cast_fp16")]; |
| tensor<int32, [1]> input0_47_axes_0 = const()[name = tensor<string, []>("input0_47_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_7_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(711567168)))]; |
| tensor<fp16, [1024]> encoder_layers_7_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(711569280)))]; |
| tensor<fp16, [1, 256, 1024]> input0_47_cast_fp16 = layer_norm(axes = input0_47_axes_0, beta = encoder_layers_7_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_7_final_layer_norm_weight_to_fp16, x = input_49_cast_fp16)[name = tensor<string, []>("input0_47_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_7_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(711571392)))]; |
| tensor<fp16, [4096]> encoder_layers_7_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(719960064)))]; |
| tensor<fp16, [1, 256, 4096]> linear_46_cast_fp16 = linear(bias = encoder_layers_7_fc1_bias_to_fp16, weight = encoder_layers_7_fc1_weight_to_fp16, x = input0_47_cast_fp16)[name = tensor<string, []>("linear_46_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_609_cast_fp16 = relu(x = linear_46_cast_fp16)[name = tensor<string, []>("op_609_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_7_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(719968320)))]; |
| tensor<fp16, [1024]> encoder_layers_7_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_7_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(728356992)))]; |
| tensor<fp16, [1, 256, 1024]> linear_47_cast_fp16 = linear(bias = encoder_layers_7_fc2_bias_to_fp16, weight = encoder_layers_7_fc2_weight_to_fp16, x = var_609_cast_fp16)[name = tensor<string, []>("linear_47_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_615_cast_fp16 = add(x = input_49_cast_fp16, y = linear_47_cast_fp16)[name = tensor<string, []>("op_615_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_35_axes_0 = const()[name = tensor<string, []>("hidden_states_35_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_8_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(728359104)))]; |
| tensor<fp16, [1024]> encoder_layers_8_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(728361216)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_35_cast_fp16 = layer_norm(axes = hidden_states_35_axes_0, beta = encoder_layers_8_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_8_self_attn_layer_norm_weight_to_fp16, x = var_615_cast_fp16)[name = tensor<string, []>("hidden_states_35_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_8_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(728363328)))]; |
| tensor<fp16, [1024]> encoder_layers_8_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(730460544)))]; |
| tensor<fp16, [1, 256, 1024]> linear_48_cast_fp16 = linear(bias = encoder_layers_8_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_q_proj_weight_to_fp16, x = hidden_states_35_cast_fp16)[name = tensor<string, []>("linear_48_cast_fp16")]; |
| tensor<int32, [4]> var_634 = const()[name = tensor<string, []>("op_634"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_635_cast_fp16 = reshape(shape = var_634, x = linear_48_cast_fp16)[name = tensor<string, []>("op_635_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_8_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(730462656)))]; |
| tensor<fp16, [1024]> encoder_layers_8_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(732559872)))]; |
| tensor<fp16, [1, 256, 1024]> linear_49_cast_fp16 = linear(bias = encoder_layers_8_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_k_proj_weight_to_fp16, x = hidden_states_35_cast_fp16)[name = tensor<string, []>("linear_49_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_8_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(732561984)))]; |
| tensor<fp16, [1024]> encoder_layers_8_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(734659200)))]; |
| tensor<fp16, [1, 256, 1024]> linear_50_cast_fp16 = linear(bias = encoder_layers_8_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_v_proj_weight_to_fp16, x = hidden_states_35_cast_fp16)[name = tensor<string, []>("linear_50_cast_fp16")]; |
| tensor<int32, [4]> var_643 = const()[name = tensor<string, []>("op_643"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_644_cast_fp16 = reshape(shape = var_643, x = linear_49_cast_fp16)[name = tensor<string, []>("op_644_cast_fp16")]; |
| tensor<int32, [4]> var_646 = const()[name = tensor<string, []>("op_646"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_647_cast_fp16 = reshape(shape = var_646, x = linear_50_cast_fp16)[name = tensor<string, []>("op_647_cast_fp16")]; |
| tensor<int32, [4]> value_18_perm_0 = const()[name = tensor<string, []>("value_18_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_650_transpose_x_0 = const()[name = tensor<string, []>("op_650_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_650_transpose_y_0 = const()[name = tensor<string, []>("op_650_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_52_perm_0 = const()[name = tensor<string, []>("transpose_52_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_53_perm_0 = const()[name = tensor<string, []>("transpose_53_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_53 = transpose(perm = transpose_53_perm_0, x = var_644_cast_fp16)[name = tensor<string, []>("transpose_73")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_52 = transpose(perm = transpose_52_perm_0, x = var_635_cast_fp16)[name = tensor<string, []>("transpose_74")]; |
| tensor<fp16, [1, 16, 256, 256]> var_650_cast_fp16 = matmul(transpose_x = var_650_transpose_x_0, transpose_y = var_650_transpose_y_0, x = transpose_52, y = transpose_53)[name = tensor<string, []>("op_650_cast_fp16")]; |
| tensor<fp16, []> var_651_to_fp16 = const()[name = tensor<string, []>("op_651_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_18_cast_fp16 = mul(x = var_650_cast_fp16, y = var_651_to_fp16)[name = tensor<string, []>("attn_weights_18_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_53_cast_fp16 = add(x = attn_weights_18_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_53_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_51_cast_fp16 = softmax(axis = var_18, x = input_53_cast_fp16)[name = tensor<string, []>("input0_51_cast_fp16")]; |
| tensor<bool, []> attn_output_18_transpose_x_0 = const()[name = tensor<string, []>("attn_output_18_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_18_transpose_y_0 = const()[name = tensor<string, []>("attn_output_18_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_18_cast_fp16 = transpose(perm = value_18_perm_0, x = var_647_cast_fp16)[name = tensor<string, []>("transpose_75")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_18_cast_fp16 = matmul(transpose_x = attn_output_18_transpose_x_0, transpose_y = attn_output_18_transpose_y_0, x = input0_51_cast_fp16, y = value_18_cast_fp16)[name = tensor<string, []>("attn_output_18_cast_fp16")]; |
| tensor<int32, [4]> var_657_perm_0 = const()[name = tensor<string, []>("op_657_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_659 = const()[name = tensor<string, []>("op_659"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_657_cast_fp16 = transpose(perm = var_657_perm_0, x = attn_output_18_cast_fp16)[name = tensor<string, []>("transpose_72")]; |
| tensor<fp16, [1, 256, 1024]> var_660_cast_fp16 = reshape(shape = var_659, x = var_657_cast_fp16)[name = tensor<string, []>("op_660_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_8_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(734661312)))]; |
| tensor<fp16, [1024]> encoder_layers_8_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(736758528)))]; |
| tensor<fp16, [1, 256, 1024]> linear_51_cast_fp16 = linear(bias = encoder_layers_8_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_out_proj_weight_to_fp16, x = var_660_cast_fp16)[name = tensor<string, []>("linear_51_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_55_cast_fp16 = add(x = var_615_cast_fp16, y = linear_51_cast_fp16)[name = tensor<string, []>("input_55_cast_fp16")]; |
| tensor<int32, [1]> input0_53_axes_0 = const()[name = tensor<string, []>("input0_53_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_8_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(736760640)))]; |
| tensor<fp16, [1024]> encoder_layers_8_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(736762752)))]; |
| tensor<fp16, [1, 256, 1024]> input0_53_cast_fp16 = layer_norm(axes = input0_53_axes_0, beta = encoder_layers_8_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_8_final_layer_norm_weight_to_fp16, x = input_55_cast_fp16)[name = tensor<string, []>("input0_53_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_8_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(736764864)))]; |
| tensor<fp16, [4096]> encoder_layers_8_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(745153536)))]; |
| tensor<fp16, [1, 256, 4096]> linear_52_cast_fp16 = linear(bias = encoder_layers_8_fc1_bias_to_fp16, weight = encoder_layers_8_fc1_weight_to_fp16, x = input0_53_cast_fp16)[name = tensor<string, []>("linear_52_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_674_cast_fp16 = relu(x = linear_52_cast_fp16)[name = tensor<string, []>("op_674_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_8_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(745161792)))]; |
| tensor<fp16, [1024]> encoder_layers_8_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_8_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(753550464)))]; |
| tensor<fp16, [1, 256, 1024]> linear_53_cast_fp16 = linear(bias = encoder_layers_8_fc2_bias_to_fp16, weight = encoder_layers_8_fc2_weight_to_fp16, x = var_674_cast_fp16)[name = tensor<string, []>("linear_53_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_680_cast_fp16 = add(x = input_55_cast_fp16, y = linear_53_cast_fp16)[name = tensor<string, []>("op_680_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_39_axes_0 = const()[name = tensor<string, []>("hidden_states_39_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_9_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(753552576)))]; |
| tensor<fp16, [1024]> encoder_layers_9_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(753554688)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_39_cast_fp16 = layer_norm(axes = hidden_states_39_axes_0, beta = encoder_layers_9_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_9_self_attn_layer_norm_weight_to_fp16, x = var_680_cast_fp16)[name = tensor<string, []>("hidden_states_39_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_9_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(753556800)))]; |
| tensor<fp16, [1024]> encoder_layers_9_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(755654016)))]; |
| tensor<fp16, [1, 256, 1024]> linear_54_cast_fp16 = linear(bias = encoder_layers_9_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_q_proj_weight_to_fp16, x = hidden_states_39_cast_fp16)[name = tensor<string, []>("linear_54_cast_fp16")]; |
| tensor<int32, [4]> var_699 = const()[name = tensor<string, []>("op_699"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_700_cast_fp16 = reshape(shape = var_699, x = linear_54_cast_fp16)[name = tensor<string, []>("op_700_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_9_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(755656128)))]; |
| tensor<fp16, [1024]> encoder_layers_9_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(757753344)))]; |
| tensor<fp16, [1, 256, 1024]> linear_55_cast_fp16 = linear(bias = encoder_layers_9_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_k_proj_weight_to_fp16, x = hidden_states_39_cast_fp16)[name = tensor<string, []>("linear_55_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_9_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(757755456)))]; |
| tensor<fp16, [1024]> encoder_layers_9_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(759852672)))]; |
| tensor<fp16, [1, 256, 1024]> linear_56_cast_fp16 = linear(bias = encoder_layers_9_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_v_proj_weight_to_fp16, x = hidden_states_39_cast_fp16)[name = tensor<string, []>("linear_56_cast_fp16")]; |
| tensor<int32, [4]> var_708 = const()[name = tensor<string, []>("op_708"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_709_cast_fp16 = reshape(shape = var_708, x = linear_55_cast_fp16)[name = tensor<string, []>("op_709_cast_fp16")]; |
| tensor<int32, [4]> var_711 = const()[name = tensor<string, []>("op_711"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_712_cast_fp16 = reshape(shape = var_711, x = linear_56_cast_fp16)[name = tensor<string, []>("op_712_cast_fp16")]; |
| tensor<int32, [4]> value_20_perm_0 = const()[name = tensor<string, []>("value_20_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_715_transpose_x_0 = const()[name = tensor<string, []>("op_715_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_715_transpose_y_0 = const()[name = tensor<string, []>("op_715_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_54_perm_0 = const()[name = tensor<string, []>("transpose_54_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_55_perm_0 = const()[name = tensor<string, []>("transpose_55_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_55 = transpose(perm = transpose_55_perm_0, x = var_709_cast_fp16)[name = tensor<string, []>("transpose_69")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_54 = transpose(perm = transpose_54_perm_0, x = var_700_cast_fp16)[name = tensor<string, []>("transpose_70")]; |
| tensor<fp16, [1, 16, 256, 256]> var_715_cast_fp16 = matmul(transpose_x = var_715_transpose_x_0, transpose_y = var_715_transpose_y_0, x = transpose_54, y = transpose_55)[name = tensor<string, []>("op_715_cast_fp16")]; |
| tensor<fp16, []> var_716_to_fp16 = const()[name = tensor<string, []>("op_716_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_20_cast_fp16 = mul(x = var_715_cast_fp16, y = var_716_to_fp16)[name = tensor<string, []>("attn_weights_20_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_59_cast_fp16 = add(x = attn_weights_20_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_59_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_57_cast_fp16 = softmax(axis = var_18, x = input_59_cast_fp16)[name = tensor<string, []>("input0_57_cast_fp16")]; |
| tensor<bool, []> attn_output_20_transpose_x_0 = const()[name = tensor<string, []>("attn_output_20_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_20_transpose_y_0 = const()[name = tensor<string, []>("attn_output_20_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_20_cast_fp16 = transpose(perm = value_20_perm_0, x = var_712_cast_fp16)[name = tensor<string, []>("transpose_71")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_20_cast_fp16 = matmul(transpose_x = attn_output_20_transpose_x_0, transpose_y = attn_output_20_transpose_y_0, x = input0_57_cast_fp16, y = value_20_cast_fp16)[name = tensor<string, []>("attn_output_20_cast_fp16")]; |
| tensor<int32, [4]> var_722_perm_0 = const()[name = tensor<string, []>("op_722_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_724 = const()[name = tensor<string, []>("op_724"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_722_cast_fp16 = transpose(perm = var_722_perm_0, x = attn_output_20_cast_fp16)[name = tensor<string, []>("transpose_68")]; |
| tensor<fp16, [1, 256, 1024]> var_725_cast_fp16 = reshape(shape = var_724, x = var_722_cast_fp16)[name = tensor<string, []>("op_725_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_9_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(759854784)))]; |
| tensor<fp16, [1024]> encoder_layers_9_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(761952000)))]; |
| tensor<fp16, [1, 256, 1024]> linear_57_cast_fp16 = linear(bias = encoder_layers_9_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_out_proj_weight_to_fp16, x = var_725_cast_fp16)[name = tensor<string, []>("linear_57_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_61_cast_fp16 = add(x = var_680_cast_fp16, y = linear_57_cast_fp16)[name = tensor<string, []>("input_61_cast_fp16")]; |
| tensor<int32, [1]> input0_59_axes_0 = const()[name = tensor<string, []>("input0_59_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_9_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(761954112)))]; |
| tensor<fp16, [1024]> encoder_layers_9_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(761956224)))]; |
| tensor<fp16, [1, 256, 1024]> input0_59_cast_fp16 = layer_norm(axes = input0_59_axes_0, beta = encoder_layers_9_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_9_final_layer_norm_weight_to_fp16, x = input_61_cast_fp16)[name = tensor<string, []>("input0_59_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_9_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(761958336)))]; |
| tensor<fp16, [4096]> encoder_layers_9_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(770347008)))]; |
| tensor<fp16, [1, 256, 4096]> linear_58_cast_fp16 = linear(bias = encoder_layers_9_fc1_bias_to_fp16, weight = encoder_layers_9_fc1_weight_to_fp16, x = input0_59_cast_fp16)[name = tensor<string, []>("linear_58_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_739_cast_fp16 = relu(x = linear_58_cast_fp16)[name = tensor<string, []>("op_739_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_9_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(770355264)))]; |
| tensor<fp16, [1024]> encoder_layers_9_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_9_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(778743936)))]; |
| tensor<fp16, [1, 256, 1024]> linear_59_cast_fp16 = linear(bias = encoder_layers_9_fc2_bias_to_fp16, weight = encoder_layers_9_fc2_weight_to_fp16, x = var_739_cast_fp16)[name = tensor<string, []>("linear_59_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_745_cast_fp16 = add(x = input_61_cast_fp16, y = linear_59_cast_fp16)[name = tensor<string, []>("op_745_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_43_axes_0 = const()[name = tensor<string, []>("hidden_states_43_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_10_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(778746048)))]; |
| tensor<fp16, [1024]> encoder_layers_10_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(778748160)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_43_cast_fp16 = layer_norm(axes = hidden_states_43_axes_0, beta = encoder_layers_10_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_10_self_attn_layer_norm_weight_to_fp16, x = var_745_cast_fp16)[name = tensor<string, []>("hidden_states_43_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_10_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(778750272)))]; |
| tensor<fp16, [1024]> encoder_layers_10_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(780847488)))]; |
| tensor<fp16, [1, 256, 1024]> linear_60_cast_fp16 = linear(bias = encoder_layers_10_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_q_proj_weight_to_fp16, x = hidden_states_43_cast_fp16)[name = tensor<string, []>("linear_60_cast_fp16")]; |
| tensor<int32, [4]> var_764 = const()[name = tensor<string, []>("op_764"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_765_cast_fp16 = reshape(shape = var_764, x = linear_60_cast_fp16)[name = tensor<string, []>("op_765_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_10_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(780849600)))]; |
| tensor<fp16, [1024]> encoder_layers_10_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(782946816)))]; |
| tensor<fp16, [1, 256, 1024]> linear_61_cast_fp16 = linear(bias = encoder_layers_10_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_k_proj_weight_to_fp16, x = hidden_states_43_cast_fp16)[name = tensor<string, []>("linear_61_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_10_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(782948928)))]; |
| tensor<fp16, [1024]> encoder_layers_10_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(785046144)))]; |
| tensor<fp16, [1, 256, 1024]> linear_62_cast_fp16 = linear(bias = encoder_layers_10_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_v_proj_weight_to_fp16, x = hidden_states_43_cast_fp16)[name = tensor<string, []>("linear_62_cast_fp16")]; |
| tensor<int32, [4]> var_773 = const()[name = tensor<string, []>("op_773"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_774_cast_fp16 = reshape(shape = var_773, x = linear_61_cast_fp16)[name = tensor<string, []>("op_774_cast_fp16")]; |
| tensor<int32, [4]> var_776 = const()[name = tensor<string, []>("op_776"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_777_cast_fp16 = reshape(shape = var_776, x = linear_62_cast_fp16)[name = tensor<string, []>("op_777_cast_fp16")]; |
| tensor<int32, [4]> value_22_perm_0 = const()[name = tensor<string, []>("value_22_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_780_transpose_x_0 = const()[name = tensor<string, []>("op_780_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_780_transpose_y_0 = const()[name = tensor<string, []>("op_780_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_56_perm_0 = const()[name = tensor<string, []>("transpose_56_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_57_perm_0 = const()[name = tensor<string, []>("transpose_57_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_57 = transpose(perm = transpose_57_perm_0, x = var_774_cast_fp16)[name = tensor<string, []>("transpose_65")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_56 = transpose(perm = transpose_56_perm_0, x = var_765_cast_fp16)[name = tensor<string, []>("transpose_66")]; |
| tensor<fp16, [1, 16, 256, 256]> var_780_cast_fp16 = matmul(transpose_x = var_780_transpose_x_0, transpose_y = var_780_transpose_y_0, x = transpose_56, y = transpose_57)[name = tensor<string, []>("op_780_cast_fp16")]; |
| tensor<fp16, []> var_781_to_fp16 = const()[name = tensor<string, []>("op_781_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_22_cast_fp16 = mul(x = var_780_cast_fp16, y = var_781_to_fp16)[name = tensor<string, []>("attn_weights_22_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_65_cast_fp16 = add(x = attn_weights_22_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_65_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_63_cast_fp16 = softmax(axis = var_18, x = input_65_cast_fp16)[name = tensor<string, []>("input0_63_cast_fp16")]; |
| tensor<bool, []> attn_output_22_transpose_x_0 = const()[name = tensor<string, []>("attn_output_22_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_22_transpose_y_0 = const()[name = tensor<string, []>("attn_output_22_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_22_cast_fp16 = transpose(perm = value_22_perm_0, x = var_777_cast_fp16)[name = tensor<string, []>("transpose_67")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_22_cast_fp16 = matmul(transpose_x = attn_output_22_transpose_x_0, transpose_y = attn_output_22_transpose_y_0, x = input0_63_cast_fp16, y = value_22_cast_fp16)[name = tensor<string, []>("attn_output_22_cast_fp16")]; |
| tensor<int32, [4]> var_787_perm_0 = const()[name = tensor<string, []>("op_787_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_789 = const()[name = tensor<string, []>("op_789"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_787_cast_fp16 = transpose(perm = var_787_perm_0, x = attn_output_22_cast_fp16)[name = tensor<string, []>("transpose_64")]; |
| tensor<fp16, [1, 256, 1024]> var_790_cast_fp16 = reshape(shape = var_789, x = var_787_cast_fp16)[name = tensor<string, []>("op_790_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_10_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(785048256)))]; |
| tensor<fp16, [1024]> encoder_layers_10_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(787145472)))]; |
| tensor<fp16, [1, 256, 1024]> linear_63_cast_fp16 = linear(bias = encoder_layers_10_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_out_proj_weight_to_fp16, x = var_790_cast_fp16)[name = tensor<string, []>("linear_63_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_67_cast_fp16 = add(x = var_745_cast_fp16, y = linear_63_cast_fp16)[name = tensor<string, []>("input_67_cast_fp16")]; |
| tensor<int32, [1]> input0_65_axes_0 = const()[name = tensor<string, []>("input0_65_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_10_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(787147584)))]; |
| tensor<fp16, [1024]> encoder_layers_10_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(787149696)))]; |
| tensor<fp16, [1, 256, 1024]> input0_65_cast_fp16 = layer_norm(axes = input0_65_axes_0, beta = encoder_layers_10_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_10_final_layer_norm_weight_to_fp16, x = input_67_cast_fp16)[name = tensor<string, []>("input0_65_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_10_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(787151808)))]; |
| tensor<fp16, [4096]> encoder_layers_10_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(795540480)))]; |
| tensor<fp16, [1, 256, 4096]> linear_64_cast_fp16 = linear(bias = encoder_layers_10_fc1_bias_to_fp16, weight = encoder_layers_10_fc1_weight_to_fp16, x = input0_65_cast_fp16)[name = tensor<string, []>("linear_64_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_804_cast_fp16 = relu(x = linear_64_cast_fp16)[name = tensor<string, []>("op_804_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_10_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(795548736)))]; |
| tensor<fp16, [1024]> encoder_layers_10_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_10_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(803937408)))]; |
| tensor<fp16, [1, 256, 1024]> linear_65_cast_fp16 = linear(bias = encoder_layers_10_fc2_bias_to_fp16, weight = encoder_layers_10_fc2_weight_to_fp16, x = var_804_cast_fp16)[name = tensor<string, []>("linear_65_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_810_cast_fp16 = add(x = input_67_cast_fp16, y = linear_65_cast_fp16)[name = tensor<string, []>("op_810_cast_fp16")]; |
| tensor<int32, [1]> hidden_states_1_axes_0 = const()[name = tensor<string, []>("hidden_states_1_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_11_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_self_attn_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(803939520)))]; |
| tensor<fp16, [1024]> encoder_layers_11_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_self_attn_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(803941632)))]; |
| tensor<fp16, [1, 256, 1024]> hidden_states_1_cast_fp16 = layer_norm(axes = hidden_states_1_axes_0, beta = encoder_layers_11_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_11_self_attn_layer_norm_weight_to_fp16, x = var_810_cast_fp16)[name = tensor<string, []>("hidden_states_1_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_11_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(803943744)))]; |
| tensor<fp16, [1024]> encoder_layers_11_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(806040960)))]; |
| tensor<fp16, [1, 256, 1024]> linear_66_cast_fp16 = linear(bias = encoder_layers_11_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_q_proj_weight_to_fp16, x = hidden_states_1_cast_fp16)[name = tensor<string, []>("linear_66_cast_fp16")]; |
| tensor<int32, [4]> var_829 = const()[name = tensor<string, []>("op_829"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_830_cast_fp16 = reshape(shape = var_829, x = linear_66_cast_fp16)[name = tensor<string, []>("op_830_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_11_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(806043072)))]; |
| tensor<fp16, [1024]> encoder_layers_11_self_attn_k_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_self_attn_k_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(808140288)))]; |
| tensor<fp16, [1, 256, 1024]> linear_67_cast_fp16 = linear(bias = encoder_layers_11_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_k_proj_weight_to_fp16, x = hidden_states_1_cast_fp16)[name = tensor<string, []>("linear_67_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_11_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(808142400)))]; |
| tensor<fp16, [1024]> encoder_layers_11_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(810239616)))]; |
| tensor<fp16, [1, 256, 1024]> linear_68_cast_fp16 = linear(bias = encoder_layers_11_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_v_proj_weight_to_fp16, x = hidden_states_1_cast_fp16)[name = tensor<string, []>("linear_68_cast_fp16")]; |
| tensor<int32, [4]> var_838 = const()[name = tensor<string, []>("op_838"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_839_cast_fp16 = reshape(shape = var_838, x = linear_67_cast_fp16)[name = tensor<string, []>("op_839_cast_fp16")]; |
| tensor<int32, [4]> var_841 = const()[name = tensor<string, []>("op_841"), val = tensor<int32, [4]>([1, 256, -1, 64])]; |
| tensor<fp16, [1, 256, 16, 64]> var_842_cast_fp16 = reshape(shape = var_841, x = linear_68_cast_fp16)[name = tensor<string, []>("op_842_cast_fp16")]; |
| tensor<int32, [4]> value_1_perm_0 = const()[name = tensor<string, []>("value_1_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<bool, []> var_845_transpose_x_0 = const()[name = tensor<string, []>("op_845_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> var_845_transpose_y_0 = const()[name = tensor<string, []>("op_845_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<int32, [4]> transpose_58_perm_0 = const()[name = tensor<string, []>("transpose_58_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])]; |
| tensor<int32, [4]> transpose_59_perm_0 = const()[name = tensor<string, []>("transpose_59_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])]; |
| tensor<fp16, [1, 16, 64, 256]> transpose_59 = transpose(perm = transpose_59_perm_0, x = var_839_cast_fp16)[name = tensor<string, []>("transpose_61")]; |
| tensor<fp16, [1, 16, 256, 64]> transpose_58 = transpose(perm = transpose_58_perm_0, x = var_830_cast_fp16)[name = tensor<string, []>("transpose_62")]; |
| tensor<fp16, [1, 16, 256, 256]> var_845_cast_fp16 = matmul(transpose_x = var_845_transpose_x_0, transpose_y = var_845_transpose_y_0, x = transpose_58, y = transpose_59)[name = tensor<string, []>("op_845_cast_fp16")]; |
| tensor<fp16, []> var_846_to_fp16 = const()[name = tensor<string, []>("op_846_to_fp16"), val = tensor<fp16, []>(0x1p-3)]; |
| tensor<fp16, [1, 16, 256, 256]> attn_weights_1_cast_fp16 = mul(x = var_845_cast_fp16, y = var_846_to_fp16)[name = tensor<string, []>("attn_weights_1_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input_4_cast_fp16 = add(x = attn_weights_1_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor<string, []>("input_4_cast_fp16")]; |
| tensor<fp16, [1, 16, 256, 256]> input0_4_cast_fp16 = softmax(axis = var_18, x = input_4_cast_fp16)[name = tensor<string, []>("input0_4_cast_fp16")]; |
| tensor<bool, []> attn_output_1_transpose_x_0 = const()[name = tensor<string, []>("attn_output_1_transpose_x_0"), val = tensor<bool, []>(false)]; |
| tensor<bool, []> attn_output_1_transpose_y_0 = const()[name = tensor<string, []>("attn_output_1_transpose_y_0"), val = tensor<bool, []>(false)]; |
| tensor<fp16, [1, 16, 256, 64]> value_1_cast_fp16 = transpose(perm = value_1_perm_0, x = var_842_cast_fp16)[name = tensor<string, []>("transpose_63")]; |
| tensor<fp16, [1, 16, 256, 64]> attn_output_1_cast_fp16 = matmul(transpose_x = attn_output_1_transpose_x_0, transpose_y = attn_output_1_transpose_y_0, x = input0_4_cast_fp16, y = value_1_cast_fp16)[name = tensor<string, []>("attn_output_1_cast_fp16")]; |
| tensor<int32, [4]> var_852_perm_0 = const()[name = tensor<string, []>("op_852_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])]; |
| tensor<int32, [3]> var_854 = const()[name = tensor<string, []>("op_854"), val = tensor<int32, [3]>([1, 256, -1])]; |
| tensor<fp16, [1, 256, 16, 64]> var_852_cast_fp16 = transpose(perm = var_852_perm_0, x = attn_output_1_cast_fp16)[name = tensor<string, []>("transpose_60")]; |
| tensor<fp16, [1, 256, 1024]> var_855_cast_fp16 = reshape(shape = var_854, x = var_852_cast_fp16)[name = tensor<string, []>("op_855_cast_fp16")]; |
| tensor<fp16, [1024, 1024]> encoder_layers_11_self_attn_out_proj_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_self_attn_out_proj_weight_to_fp16"), val = tensor<fp16, [1024, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(810241728)))]; |
| tensor<fp16, [1024]> encoder_layers_11_self_attn_out_proj_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_self_attn_out_proj_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(812338944)))]; |
| tensor<fp16, [1, 256, 1024]> linear_69_cast_fp16 = linear(bias = encoder_layers_11_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_out_proj_weight_to_fp16, x = var_855_cast_fp16)[name = tensor<string, []>("linear_69_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> input_2_cast_fp16 = add(x = var_810_cast_fp16, y = linear_69_cast_fp16)[name = tensor<string, []>("input_2_cast_fp16")]; |
| tensor<int32, [1]> input0_1_axes_0 = const()[name = tensor<string, []>("input0_1_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layers_11_final_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_final_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(812341056)))]; |
| tensor<fp16, [1024]> encoder_layers_11_final_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_final_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(812343168)))]; |
| tensor<fp16, [1, 256, 1024]> input0_1_cast_fp16 = layer_norm(axes = input0_1_axes_0, beta = encoder_layers_11_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_11_final_layer_norm_weight_to_fp16, x = input_2_cast_fp16)[name = tensor<string, []>("input0_1_cast_fp16")]; |
| tensor<fp16, [4096, 1024]> encoder_layers_11_fc1_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_fc1_weight_to_fp16"), val = tensor<fp16, [4096, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(812345280)))]; |
| tensor<fp16, [4096]> encoder_layers_11_fc1_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_fc1_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(820733952)))]; |
| tensor<fp16, [1, 256, 4096]> linear_70_cast_fp16 = linear(bias = encoder_layers_11_fc1_bias_to_fp16, weight = encoder_layers_11_fc1_weight_to_fp16, x = input0_1_cast_fp16)[name = tensor<string, []>("linear_70_cast_fp16")]; |
| tensor<fp16, [1, 256, 4096]> var_869_cast_fp16 = relu(x = linear_70_cast_fp16)[name = tensor<string, []>("op_869_cast_fp16")]; |
| tensor<fp16, [1024, 4096]> encoder_layers_11_fc2_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_fc2_weight_to_fp16"), val = tensor<fp16, [1024, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(820742208)))]; |
| tensor<fp16, [1024]> encoder_layers_11_fc2_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layers_11_fc2_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(829130880)))]; |
| tensor<fp16, [1, 256, 1024]> linear_71_cast_fp16 = linear(bias = encoder_layers_11_fc2_bias_to_fp16, weight = encoder_layers_11_fc2_weight_to_fp16, x = var_869_cast_fp16)[name = tensor<string, []>("linear_71_cast_fp16")]; |
| tensor<fp16, [1, 256, 1024]> var_875_cast_fp16 = add(x = input_2_cast_fp16, y = linear_71_cast_fp16)[name = tensor<string, []>("op_875_cast_fp16")]; |
| tensor<int32, [1]> var_879_axes_0 = const()[name = tensor<string, []>("op_879_axes_0"), val = tensor<int32, [1]>([-1])]; |
| tensor<fp16, [1024]> encoder_layer_norm_weight_to_fp16 = const()[name = tensor<string, []>("encoder_layer_norm_weight_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(829132992)))]; |
| tensor<fp16, [1024]> encoder_layer_norm_bias_to_fp16 = const()[name = tensor<string, []>("encoder_layer_norm_bias_to_fp16"), val = tensor<fp16, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(829135104)))]; |
| tensor<fp16, [1, 256, 1024]> var_879 = layer_norm(axes = var_879_axes_0, beta = encoder_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layer_norm_weight_to_fp16, x = var_875_cast_fp16)[name = tensor<string, []>("op_879_cast_fp16")]; |
| } -> (var_879); |
| } |