program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3510.2.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.10.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})] { func main(tensor attention_mask, tensor input_ids) { tensor text_branch_embeddings_word_embeddings_weight = const()[name = tensor("text_branch_embeddings_word_embeddings_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor text_branch_embeddings_position_embeddings_weight = const()[name = tensor("text_branch_embeddings_position_embeddings_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154414208)))]; tensor text_branch_embeddings_LayerNorm_bias = const()[name = tensor("text_branch_embeddings_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155993280)))]; tensor text_branch_embeddings_LayerNorm_weight = const()[name = tensor("text_branch_embeddings_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155996416)))]; tensor text_branch_encoder_layer_0_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_0_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155999552)))]; tensor text_branch_encoder_layer_0_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_0_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156002688)))]; tensor text_branch_encoder_layer_0_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_0_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158362048)))]; tensor text_branch_encoder_layer_0_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_0_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158365184)))]; tensor text_branch_encoder_layer_0_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_0_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160724544)))]; tensor text_branch_encoder_layer_0_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_0_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160727680)))]; tensor text_branch_encoder_layer_0_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_0_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163087040)))]; tensor text_branch_encoder_layer_0_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_0_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163090176)))]; tensor text_branch_encoder_layer_0_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_0_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165449536)))]; tensor text_branch_encoder_layer_0_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_0_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165452672)))]; tensor text_branch_encoder_layer_0_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_0_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165455808)))]; tensor text_branch_encoder_layer_0_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_0_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165468160)))]; tensor text_branch_encoder_layer_0_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_0_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(174905408)))]; tensor text_branch_encoder_layer_0_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_0_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(174908544)))]; tensor text_branch_encoder_layer_0_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_0_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184345792)))]; tensor text_branch_encoder_layer_0_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_0_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184348928)))]; tensor text_branch_encoder_layer_1_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_1_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184352064)))]; tensor text_branch_encoder_layer_1_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_1_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184355200)))]; tensor text_branch_encoder_layer_1_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_1_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186714560)))]; tensor text_branch_encoder_layer_1_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_1_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186717696)))]; tensor text_branch_encoder_layer_1_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_1_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(189077056)))]; tensor text_branch_encoder_layer_1_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_1_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(189080192)))]; tensor text_branch_encoder_layer_1_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_1_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(191439552)))]; tensor text_branch_encoder_layer_1_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_1_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(191442688)))]; tensor text_branch_encoder_layer_1_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_1_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193802048)))]; tensor text_branch_encoder_layer_1_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_1_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193805184)))]; tensor text_branch_encoder_layer_1_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_1_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193808320)))]; tensor text_branch_encoder_layer_1_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_1_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193820672)))]; tensor text_branch_encoder_layer_1_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_1_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(203257920)))]; tensor text_branch_encoder_layer_1_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_1_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(203261056)))]; tensor text_branch_encoder_layer_1_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_1_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(212698304)))]; tensor text_branch_encoder_layer_1_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_1_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(212701440)))]; tensor text_branch_encoder_layer_2_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_2_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(212704576)))]; tensor text_branch_encoder_layer_2_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_2_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(212707712)))]; tensor text_branch_encoder_layer_2_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_2_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215067072)))]; tensor text_branch_encoder_layer_2_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_2_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215070208)))]; tensor text_branch_encoder_layer_2_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_2_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217429568)))]; tensor text_branch_encoder_layer_2_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_2_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217432704)))]; tensor text_branch_encoder_layer_2_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_2_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219792064)))]; tensor text_branch_encoder_layer_2_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_2_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219795200)))]; tensor text_branch_encoder_layer_2_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_2_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(222154560)))]; tensor text_branch_encoder_layer_2_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_2_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(222157696)))]; tensor text_branch_encoder_layer_2_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_2_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(222160832)))]; tensor text_branch_encoder_layer_2_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_2_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(222173184)))]; tensor text_branch_encoder_layer_2_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_2_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(231610432)))]; tensor text_branch_encoder_layer_2_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_2_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(231613568)))]; tensor text_branch_encoder_layer_2_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_2_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241050816)))]; tensor text_branch_encoder_layer_2_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_2_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241053952)))]; tensor text_branch_encoder_layer_3_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_3_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241057088)))]; tensor text_branch_encoder_layer_3_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_3_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241060224)))]; tensor text_branch_encoder_layer_3_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_3_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(243419584)))]; tensor text_branch_encoder_layer_3_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_3_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(243422720)))]; tensor text_branch_encoder_layer_3_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_3_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245782080)))]; tensor text_branch_encoder_layer_3_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_3_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245785216)))]; tensor text_branch_encoder_layer_3_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_3_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(248144576)))]; tensor text_branch_encoder_layer_3_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_3_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(248147712)))]; tensor text_branch_encoder_layer_3_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_3_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250507072)))]; tensor text_branch_encoder_layer_3_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_3_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250510208)))]; tensor text_branch_encoder_layer_3_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_3_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250513344)))]; tensor text_branch_encoder_layer_3_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_3_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250525696)))]; tensor text_branch_encoder_layer_3_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_3_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259962944)))]; tensor text_branch_encoder_layer_3_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_3_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259966080)))]; tensor text_branch_encoder_layer_3_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_3_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(269403328)))]; tensor text_branch_encoder_layer_3_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_3_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(269406464)))]; tensor text_branch_encoder_layer_4_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_4_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(269409600)))]; tensor text_branch_encoder_layer_4_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_4_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(269412736)))]; tensor text_branch_encoder_layer_4_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_4_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(271772096)))]; tensor text_branch_encoder_layer_4_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_4_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(271775232)))]; tensor text_branch_encoder_layer_4_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_4_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274134592)))]; tensor text_branch_encoder_layer_4_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_4_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274137728)))]; tensor text_branch_encoder_layer_4_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_4_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(276497088)))]; tensor text_branch_encoder_layer_4_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_4_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(276500224)))]; tensor text_branch_encoder_layer_4_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_4_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278859584)))]; tensor text_branch_encoder_layer_4_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_4_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278862720)))]; tensor text_branch_encoder_layer_4_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_4_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278865856)))]; tensor text_branch_encoder_layer_4_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_4_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278878208)))]; tensor text_branch_encoder_layer_4_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_4_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288315456)))]; tensor text_branch_encoder_layer_4_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_4_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288318592)))]; tensor text_branch_encoder_layer_4_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_4_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297755840)))]; tensor text_branch_encoder_layer_4_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_4_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297758976)))]; tensor text_branch_encoder_layer_5_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_5_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297762112)))]; tensor text_branch_encoder_layer_5_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_5_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297765248)))]; tensor text_branch_encoder_layer_5_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_5_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(300124608)))]; tensor text_branch_encoder_layer_5_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_5_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(300127744)))]; tensor text_branch_encoder_layer_5_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_5_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302487104)))]; tensor text_branch_encoder_layer_5_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_5_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302490240)))]; tensor text_branch_encoder_layer_5_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_5_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304849600)))]; tensor text_branch_encoder_layer_5_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_5_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304852736)))]; tensor text_branch_encoder_layer_5_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_5_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(307212096)))]; tensor text_branch_encoder_layer_5_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_5_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(307215232)))]; tensor text_branch_encoder_layer_5_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_5_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(307218368)))]; tensor text_branch_encoder_layer_5_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_5_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(307230720)))]; tensor text_branch_encoder_layer_5_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_5_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316667968)))]; tensor text_branch_encoder_layer_5_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_5_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316671104)))]; tensor text_branch_encoder_layer_5_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_5_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(326108352)))]; tensor text_branch_encoder_layer_5_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_5_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(326111488)))]; tensor text_branch_encoder_layer_6_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_6_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(326114624)))]; tensor text_branch_encoder_layer_6_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_6_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(326117760)))]; tensor text_branch_encoder_layer_6_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_6_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(328477120)))]; tensor text_branch_encoder_layer_6_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_6_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(328480256)))]; tensor text_branch_encoder_layer_6_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_6_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(330839616)))]; tensor text_branch_encoder_layer_6_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_6_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(330842752)))]; tensor text_branch_encoder_layer_6_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_6_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(333202112)))]; tensor text_branch_encoder_layer_6_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_6_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(333205248)))]; tensor text_branch_encoder_layer_6_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_6_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(335564608)))]; tensor text_branch_encoder_layer_6_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_6_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(335567744)))]; tensor text_branch_encoder_layer_6_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_6_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(335570880)))]; tensor text_branch_encoder_layer_6_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_6_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(335583232)))]; tensor text_branch_encoder_layer_6_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_6_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345020480)))]; tensor text_branch_encoder_layer_6_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_6_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345023616)))]; tensor text_branch_encoder_layer_6_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_6_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354460864)))]; tensor text_branch_encoder_layer_6_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_6_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354464000)))]; tensor text_branch_encoder_layer_7_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_7_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354467136)))]; tensor text_branch_encoder_layer_7_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_7_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354470272)))]; tensor text_branch_encoder_layer_7_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_7_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(356829632)))]; tensor text_branch_encoder_layer_7_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_7_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(356832768)))]; tensor text_branch_encoder_layer_7_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_7_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(359192128)))]; tensor text_branch_encoder_layer_7_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_7_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(359195264)))]; tensor text_branch_encoder_layer_7_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_7_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361554624)))]; tensor text_branch_encoder_layer_7_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_7_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361557760)))]; tensor text_branch_encoder_layer_7_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_7_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(363917120)))]; tensor text_branch_encoder_layer_7_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_7_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(363920256)))]; tensor text_branch_encoder_layer_7_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_7_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(363923392)))]; tensor text_branch_encoder_layer_7_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_7_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(363935744)))]; tensor text_branch_encoder_layer_7_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_7_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(373372992)))]; tensor text_branch_encoder_layer_7_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_7_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(373376128)))]; tensor text_branch_encoder_layer_7_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_7_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382813376)))]; tensor text_branch_encoder_layer_7_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_7_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382816512)))]; tensor text_branch_encoder_layer_8_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_8_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382819648)))]; tensor text_branch_encoder_layer_8_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_8_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382822784)))]; tensor text_branch_encoder_layer_8_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_8_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(385182144)))]; tensor text_branch_encoder_layer_8_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_8_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(385185280)))]; tensor text_branch_encoder_layer_8_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_8_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387544640)))]; tensor text_branch_encoder_layer_8_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_8_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387547776)))]; tensor text_branch_encoder_layer_8_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_8_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(389907136)))]; tensor text_branch_encoder_layer_8_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_8_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(389910272)))]; tensor text_branch_encoder_layer_8_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_8_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(392269632)))]; tensor text_branch_encoder_layer_8_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_8_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(392272768)))]; tensor text_branch_encoder_layer_8_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_8_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(392275904)))]; tensor text_branch_encoder_layer_8_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_8_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(392288256)))]; tensor text_branch_encoder_layer_8_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_8_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(401725504)))]; tensor text_branch_encoder_layer_8_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_8_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(401728640)))]; tensor text_branch_encoder_layer_8_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_8_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(411165888)))]; tensor text_branch_encoder_layer_8_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_8_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(411169024)))]; tensor text_branch_encoder_layer_9_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_9_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(411172160)))]; tensor text_branch_encoder_layer_9_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_9_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(411175296)))]; tensor text_branch_encoder_layer_9_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_9_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(413534656)))]; tensor text_branch_encoder_layer_9_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_9_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(413537792)))]; tensor text_branch_encoder_layer_9_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_9_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415897152)))]; tensor text_branch_encoder_layer_9_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_9_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415900288)))]; tensor text_branch_encoder_layer_9_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_9_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418259648)))]; tensor text_branch_encoder_layer_9_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_9_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418262784)))]; tensor text_branch_encoder_layer_9_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_9_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(420622144)))]; tensor text_branch_encoder_layer_9_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_9_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(420625280)))]; tensor text_branch_encoder_layer_9_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_9_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(420628416)))]; tensor text_branch_encoder_layer_9_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_9_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(420640768)))]; tensor text_branch_encoder_layer_9_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_9_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(430078016)))]; tensor text_branch_encoder_layer_9_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_9_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(430081152)))]; tensor text_branch_encoder_layer_9_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_9_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(439518400)))]; tensor text_branch_encoder_layer_9_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_9_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(439521536)))]; tensor text_branch_encoder_layer_10_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_10_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(439524672)))]; tensor text_branch_encoder_layer_10_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_10_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(439527808)))]; tensor text_branch_encoder_layer_10_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_10_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(441887168)))]; tensor text_branch_encoder_layer_10_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_10_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(441890304)))]; tensor text_branch_encoder_layer_10_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_10_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(444249664)))]; tensor text_branch_encoder_layer_10_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_10_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(444252800)))]; tensor text_branch_encoder_layer_10_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_10_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446612160)))]; tensor text_branch_encoder_layer_10_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_10_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446615296)))]; tensor text_branch_encoder_layer_10_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_10_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448974656)))]; tensor text_branch_encoder_layer_10_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_10_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448977792)))]; tensor text_branch_encoder_layer_10_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_10_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448980928)))]; tensor text_branch_encoder_layer_10_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_10_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448993280)))]; tensor text_branch_encoder_layer_10_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_10_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(458430528)))]; tensor text_branch_encoder_layer_10_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_10_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(458433664)))]; tensor text_branch_encoder_layer_10_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_10_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(467870912)))]; tensor text_branch_encoder_layer_10_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_10_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(467874048)))]; tensor text_branch_encoder_layer_11_attention_self_query_bias = const()[name = tensor("text_branch_encoder_layer_11_attention_self_query_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(467877184)))]; tensor text_branch_encoder_layer_11_attention_self_query_weight = const()[name = tensor("text_branch_encoder_layer_11_attention_self_query_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(467880320)))]; tensor text_branch_encoder_layer_11_attention_self_key_bias = const()[name = tensor("text_branch_encoder_layer_11_attention_self_key_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(470239680)))]; tensor text_branch_encoder_layer_11_attention_self_key_weight = const()[name = tensor("text_branch_encoder_layer_11_attention_self_key_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(470242816)))]; tensor text_branch_encoder_layer_11_attention_self_value_bias = const()[name = tensor("text_branch_encoder_layer_11_attention_self_value_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(472602176)))]; tensor text_branch_encoder_layer_11_attention_self_value_weight = const()[name = tensor("text_branch_encoder_layer_11_attention_self_value_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(472605312)))]; tensor text_branch_encoder_layer_11_attention_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_11_attention_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(474964672)))]; tensor text_branch_encoder_layer_11_attention_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_11_attention_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(474967808)))]; tensor text_branch_encoder_layer_11_attention_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_11_attention_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(477327168)))]; tensor text_branch_encoder_layer_11_attention_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_11_attention_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(477330304)))]; tensor text_branch_encoder_layer_11_intermediate_dense_bias = const()[name = tensor("text_branch_encoder_layer_11_intermediate_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(477333440)))]; tensor text_branch_encoder_layer_11_intermediate_dense_weight = const()[name = tensor("text_branch_encoder_layer_11_intermediate_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(477345792)))]; tensor text_branch_encoder_layer_11_output_dense_bias = const()[name = tensor("text_branch_encoder_layer_11_output_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(486783040)))]; tensor text_branch_encoder_layer_11_output_dense_weight = const()[name = tensor("text_branch_encoder_layer_11_output_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(486786176)))]; tensor text_branch_encoder_layer_11_output_LayerNorm_bias = const()[name = tensor("text_branch_encoder_layer_11_output_LayerNorm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496223424)))]; tensor text_branch_encoder_layer_11_output_LayerNorm_weight = const()[name = tensor("text_branch_encoder_layer_11_output_LayerNorm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496226560)))]; tensor text_branch_pooler_dense_bias = const()[name = tensor("text_branch_pooler_dense_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496229696)))]; tensor text_branch_pooler_dense_weight = const()[name = tensor("text_branch_pooler_dense_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496232832)))]; tensor text_projection_0_bias = const()[name = tensor("text_projection_0_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(498592192)))]; tensor text_projection_0_weight = const()[name = tensor("text_projection_0_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(498594304)))]; tensor text_projection_2_bias = const()[name = tensor("text_projection_2_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(500167232)))]; tensor text_projection_2_weight = const()[name = tensor("text_projection_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(500169344)))]; tensor var_10 = const()[name = tensor("op_10"), val = tensor(-1)]; tensor var_12 = const()[name = tensor("op_12"), val = tensor(0x1.4f8b58p-17)]; tensor var_15 = const()[name = tensor("op_15"), val = tensor(0x1p+0)]; tensor var_22 = const()[name = tensor("op_22"), val = tensor(1)]; tensor var_36_axes_0 = const()[name = tensor("op_36_axes_0"), val = tensor([1])]; tensor var_36 = expand_dims(axes = var_36_axes_0, x = attention_mask)[name = tensor("op_36")]; tensor var_37_axes_0 = const()[name = tensor("op_37_axes_0"), val = tensor([2])]; tensor var_37 = expand_dims(axes = var_37_axes_0, x = var_36)[name = tensor("op_37")]; tensor var_39_dtype_0 = const()[name = tensor("op_39_dtype_0"), val = tensor("fp32")]; tensor var_39 = cast(dtype = var_39_dtype_0, x = var_37)[name = tensor("cast_78")]; tensor var_40 = sub(x = var_15, y = var_39)[name = tensor("op_40")]; tensor var_41 = const()[name = tensor("op_41"), val = tensor(-0x1.fffffep+127)]; tensor attention_mask_1 = mul(x = var_40, y = var_41)[name = tensor("attention_mask")]; tensor var_47 = not_equal(x = input_ids, y = var_22)[name = tensor("op_47")]; tensor mask_dtype_0 = const()[name = tensor("mask_dtype_0"), val = tensor("int32")]; tensor var_49_exclusive_0 = const()[name = tensor("op_49_exclusive_0"), val = tensor(false)]; tensor var_49_reverse_0 = const()[name = tensor("op_49_reverse_0"), val = tensor(false)]; tensor mask = cast(dtype = mask_dtype_0, x = var_47)[name = tensor("cast_77")]; tensor var_49 = cumsum(axis = var_22, exclusive = var_49_exclusive_0, reverse = var_49_reverse_0, x = mask)[name = tensor("op_49")]; tensor incremental_indices = mul(x = var_49, y = mask)[name = tensor("incremental_indices")]; tensor var_55 = const()[name = tensor("op_55"), val = tensor(1)]; tensor input_3 = add(x = incremental_indices, y = var_55)[name = tensor("input_3")]; tensor inputs_embeds_batch_dims_0 = const()[name = tensor("inputs_embeds_batch_dims_0"), val = tensor(0)]; tensor inputs_embeds_validate_indices_0 = const()[name = tensor("inputs_embeds_validate_indices_0"), val = tensor(false)]; tensor greater_equal_0_y_0 = const()[name = tensor("greater_equal_0_y_0"), val = tensor(0)]; tensor greater_equal_0 = greater_equal(x = input_ids, y = greater_equal_0_y_0)[name = tensor("greater_equal_0")]; tensor slice_by_index_0 = const()[name = tensor("slice_by_index_0"), val = tensor(50265)]; tensor add_0 = add(x = input_ids, y = slice_by_index_0)[name = tensor("add_0")]; tensor select_0 = select(a = input_ids, b = add_0, cond = greater_equal_0)[name = tensor("select_0")]; tensor inputs_embeds_axis_1 = const()[name = tensor("inputs_embeds_axis_1"), val = tensor(0)]; tensor inputs_embeds = gather(axis = inputs_embeds_axis_1, batch_dims = inputs_embeds_batch_dims_0, indices = select_0, validate_indices = inputs_embeds_validate_indices_0, x = text_branch_embeddings_word_embeddings_weight)[name = tensor("inputs_embeds")]; tensor token_type_embeddings_1 = const()[name = tensor("token_type_embeddings_1"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(501217984)))]; tensor embeddings_1 = add(x = inputs_embeds, y = token_type_embeddings_1)[name = tensor("embeddings_1")]; tensor position_embeddings_1_batch_dims_0 = const()[name = tensor("position_embeddings_1_batch_dims_0"), val = tensor(0)]; tensor position_embeddings_1_validate_indices_0 = const()[name = tensor("position_embeddings_1_validate_indices_0"), val = tensor(false)]; tensor greater_equal_1_y_0 = const()[name = tensor("greater_equal_1_y_0"), val = tensor(0)]; tensor greater_equal_1 = greater_equal(x = input_3, y = greater_equal_1_y_0)[name = tensor("greater_equal_1")]; tensor slice_by_index_1 = const()[name = tensor("slice_by_index_1"), val = tensor(514)]; tensor add_1 = add(x = input_3, y = slice_by_index_1)[name = tensor("add_1")]; tensor select_1 = select(a = input_3, b = add_1, cond = greater_equal_1)[name = tensor("select_1")]; tensor position_embeddings_1_axis_1 = const()[name = tensor("position_embeddings_1_axis_1"), val = tensor(0)]; tensor position_embeddings_1 = gather(axis = position_embeddings_1_axis_1, batch_dims = position_embeddings_1_batch_dims_0, indices = select_1, validate_indices = position_embeddings_1_validate_indices_0, x = text_branch_embeddings_position_embeddings_weight)[name = tensor("position_embeddings_1")]; tensor input_5 = add(x = embeddings_1, y = position_embeddings_1)[name = tensor("input_5")]; tensor input_7_axes_0 = const()[name = tensor("input_7_axes_0"), val = tensor([-1])]; tensor input_7 = layer_norm(axes = input_7_axes_0, beta = text_branch_embeddings_LayerNorm_bias, epsilon = var_12, gamma = text_branch_embeddings_LayerNorm_weight, x = input_5)[name = tensor("input_7")]; tensor x_9 = linear(bias = text_branch_encoder_layer_0_attention_self_query_bias, weight = text_branch_encoder_layer_0_attention_self_query_weight, x = input_7)[name = tensor("linear_0")]; tensor x_1 = linear(bias = text_branch_encoder_layer_0_attention_self_key_bias, weight = text_branch_encoder_layer_0_attention_self_key_weight, x = input_7)[name = tensor("linear_1")]; tensor var_110 = const()[name = tensor("op_110"), val = tensor([1, 512, 12, 64])]; tensor x_3 = reshape(shape = var_110, x = x_1)[name = tensor("x_3")]; tensor x_5 = linear(bias = text_branch_encoder_layer_0_attention_self_value_bias, weight = text_branch_encoder_layer_0_attention_self_value_weight, x = input_7)[name = tensor("linear_2")]; tensor var_119 = const()[name = tensor("op_119"), val = tensor([1, 512, 12, 64])]; tensor x_7 = reshape(shape = var_119, x = x_5)[name = tensor("x_7")]; tensor var_121 = const()[name = tensor("op_121"), val = tensor([0, 2, 1, 3])]; tensor var_125 = const()[name = tensor("op_125"), val = tensor([1, 512, 12, 64])]; tensor x_11 = reshape(shape = var_125, x = x_9)[name = tensor("x_11")]; tensor attention_scores_1_transpose_x_0 = const()[name = tensor("attention_scores_1_transpose_x_0"), val = tensor(false)]; tensor attention_scores_1_transpose_y_0 = const()[name = tensor("attention_scores_1_transpose_y_0"), val = tensor(false)]; tensor transpose_36_perm_0 = const()[name = tensor("transpose_36_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_37_perm_0 = const()[name = tensor("transpose_37_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_37 = transpose(perm = transpose_37_perm_0, x = x_3)[name = tensor("transpose_105")]; tensor transpose_36 = transpose(perm = transpose_36_perm_0, x = x_11)[name = tensor("transpose_106")]; tensor attention_scores_1 = matmul(transpose_x = attention_scores_1_transpose_x_0, transpose_y = attention_scores_1_transpose_y_0, x = transpose_36, y = transpose_37)[name = tensor("attention_scores_1")]; tensor _inversed_attention_scores_3_y_0 = const()[name = tensor("_inversed_attention_scores_3_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_3 = mul(x = attention_scores_1, y = _inversed_attention_scores_3_y_0)[name = tensor("_inversed_attention_scores_3")]; tensor input_11 = add(x = _inversed_attention_scores_3, y = attention_mask_1)[name = tensor("input_11")]; tensor input_13 = softmax(axis = var_10, x = input_11)[name = tensor("input_13")]; tensor context_layer_1_transpose_x_0 = const()[name = tensor("context_layer_1_transpose_x_0"), val = tensor(false)]; tensor context_layer_1_transpose_y_0 = const()[name = tensor("context_layer_1_transpose_y_0"), val = tensor(false)]; tensor value_layer_1 = transpose(perm = var_121, x = x_7)[name = tensor("transpose_107")]; tensor context_layer_1 = matmul(transpose_x = context_layer_1_transpose_x_0, transpose_y = context_layer_1_transpose_y_0, x = input_13, y = value_layer_1)[name = tensor("context_layer_1")]; tensor var_137 = const()[name = tensor("op_137"), val = tensor([0, 2, 1, 3])]; tensor var_142 = const()[name = tensor("op_142"), val = tensor([1, 512, 768])]; tensor var_138 = transpose(perm = var_137, x = context_layer_1)[name = tensor("transpose_104")]; tensor input_15 = reshape(shape = var_142, x = var_138)[name = tensor("input_15")]; tensor input_17 = linear(bias = text_branch_encoder_layer_0_attention_output_dense_bias, weight = text_branch_encoder_layer_0_attention_output_dense_weight, x = input_15)[name = tensor("linear_3")]; tensor input_19 = add(x = input_17, y = input_7)[name = tensor("input_19")]; tensor input_21_axes_0 = const()[name = tensor("input_21_axes_0"), val = tensor([-1])]; tensor input_21 = layer_norm(axes = input_21_axes_0, beta = text_branch_encoder_layer_0_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_0_attention_output_LayerNorm_weight, x = input_19)[name = tensor("input_21")]; tensor input_23 = linear(bias = text_branch_encoder_layer_0_intermediate_dense_bias, weight = text_branch_encoder_layer_0_intermediate_dense_weight, x = input_21)[name = tensor("linear_4")]; tensor input_25_mode_0 = const()[name = tensor("input_25_mode_0"), val = tensor("EXACT")]; tensor input_25 = gelu(mode = input_25_mode_0, x = input_23)[name = tensor("input_25")]; tensor input_27 = linear(bias = text_branch_encoder_layer_0_output_dense_bias, weight = text_branch_encoder_layer_0_output_dense_weight, x = input_25)[name = tensor("linear_5")]; tensor input_29 = add(x = input_27, y = input_21)[name = tensor("input_29")]; tensor input_31_axes_0 = const()[name = tensor("input_31_axes_0"), val = tensor([-1])]; tensor input_31 = layer_norm(axes = input_31_axes_0, beta = text_branch_encoder_layer_0_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_0_output_LayerNorm_weight, x = input_29)[name = tensor("input_31")]; tensor x_21 = linear(bias = text_branch_encoder_layer_1_attention_self_query_bias, weight = text_branch_encoder_layer_1_attention_self_query_weight, x = input_31)[name = tensor("linear_6")]; tensor x_13 = linear(bias = text_branch_encoder_layer_1_attention_self_key_bias, weight = text_branch_encoder_layer_1_attention_self_key_weight, x = input_31)[name = tensor("linear_7")]; tensor var_187 = const()[name = tensor("op_187"), val = tensor([1, 512, 12, 64])]; tensor x_15 = reshape(shape = var_187, x = x_13)[name = tensor("x_15")]; tensor x_17 = linear(bias = text_branch_encoder_layer_1_attention_self_value_bias, weight = text_branch_encoder_layer_1_attention_self_value_weight, x = input_31)[name = tensor("linear_8")]; tensor var_196 = const()[name = tensor("op_196"), val = tensor([1, 512, 12, 64])]; tensor x_19 = reshape(shape = var_196, x = x_17)[name = tensor("x_19")]; tensor var_198 = const()[name = tensor("op_198"), val = tensor([0, 2, 1, 3])]; tensor var_202 = const()[name = tensor("op_202"), val = tensor([1, 512, 12, 64])]; tensor x_23 = reshape(shape = var_202, x = x_21)[name = tensor("x_23")]; tensor attention_scores_5_transpose_x_0 = const()[name = tensor("attention_scores_5_transpose_x_0"), val = tensor(false)]; tensor attention_scores_5_transpose_y_0 = const()[name = tensor("attention_scores_5_transpose_y_0"), val = tensor(false)]; tensor transpose_38_perm_0 = const()[name = tensor("transpose_38_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_39_perm_0 = const()[name = tensor("transpose_39_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_39 = transpose(perm = transpose_39_perm_0, x = x_15)[name = tensor("transpose_101")]; tensor transpose_38 = transpose(perm = transpose_38_perm_0, x = x_23)[name = tensor("transpose_102")]; tensor attention_scores_5 = matmul(transpose_x = attention_scores_5_transpose_x_0, transpose_y = attention_scores_5_transpose_y_0, x = transpose_38, y = transpose_39)[name = tensor("attention_scores_5")]; tensor _inversed_attention_scores_7_y_0 = const()[name = tensor("_inversed_attention_scores_7_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_7 = mul(x = attention_scores_5, y = _inversed_attention_scores_7_y_0)[name = tensor("_inversed_attention_scores_7")]; tensor input_33 = add(x = _inversed_attention_scores_7, y = attention_mask_1)[name = tensor("input_33")]; tensor input_35 = softmax(axis = var_10, x = input_33)[name = tensor("input_35")]; tensor context_layer_5_transpose_x_0 = const()[name = tensor("context_layer_5_transpose_x_0"), val = tensor(false)]; tensor context_layer_5_transpose_y_0 = const()[name = tensor("context_layer_5_transpose_y_0"), val = tensor(false)]; tensor value_layer_3 = transpose(perm = var_198, x = x_19)[name = tensor("transpose_103")]; tensor context_layer_5 = matmul(transpose_x = context_layer_5_transpose_x_0, transpose_y = context_layer_5_transpose_y_0, x = input_35, y = value_layer_3)[name = tensor("context_layer_5")]; tensor var_214 = const()[name = tensor("op_214"), val = tensor([0, 2, 1, 3])]; tensor var_219 = const()[name = tensor("op_219"), val = tensor([1, 512, 768])]; tensor var_215 = transpose(perm = var_214, x = context_layer_5)[name = tensor("transpose_100")]; tensor input_37 = reshape(shape = var_219, x = var_215)[name = tensor("input_37")]; tensor input_39 = linear(bias = text_branch_encoder_layer_1_attention_output_dense_bias, weight = text_branch_encoder_layer_1_attention_output_dense_weight, x = input_37)[name = tensor("linear_9")]; tensor input_41 = add(x = input_39, y = input_31)[name = tensor("input_41")]; tensor input_43_axes_0 = const()[name = tensor("input_43_axes_0"), val = tensor([-1])]; tensor input_43 = layer_norm(axes = input_43_axes_0, beta = text_branch_encoder_layer_1_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_1_attention_output_LayerNorm_weight, x = input_41)[name = tensor("input_43")]; tensor input_45 = linear(bias = text_branch_encoder_layer_1_intermediate_dense_bias, weight = text_branch_encoder_layer_1_intermediate_dense_weight, x = input_43)[name = tensor("linear_10")]; tensor input_47_mode_0 = const()[name = tensor("input_47_mode_0"), val = tensor("EXACT")]; tensor input_47 = gelu(mode = input_47_mode_0, x = input_45)[name = tensor("input_47")]; tensor input_49 = linear(bias = text_branch_encoder_layer_1_output_dense_bias, weight = text_branch_encoder_layer_1_output_dense_weight, x = input_47)[name = tensor("linear_11")]; tensor input_51 = add(x = input_49, y = input_43)[name = tensor("input_51")]; tensor input_53_axes_0 = const()[name = tensor("input_53_axes_0"), val = tensor([-1])]; tensor input_53 = layer_norm(axes = input_53_axes_0, beta = text_branch_encoder_layer_1_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_1_output_LayerNorm_weight, x = input_51)[name = tensor("input_53")]; tensor x_33 = linear(bias = text_branch_encoder_layer_2_attention_self_query_bias, weight = text_branch_encoder_layer_2_attention_self_query_weight, x = input_53)[name = tensor("linear_12")]; tensor x_25 = linear(bias = text_branch_encoder_layer_2_attention_self_key_bias, weight = text_branch_encoder_layer_2_attention_self_key_weight, x = input_53)[name = tensor("linear_13")]; tensor var_264 = const()[name = tensor("op_264"), val = tensor([1, 512, 12, 64])]; tensor x_27 = reshape(shape = var_264, x = x_25)[name = tensor("x_27")]; tensor x_29 = linear(bias = text_branch_encoder_layer_2_attention_self_value_bias, weight = text_branch_encoder_layer_2_attention_self_value_weight, x = input_53)[name = tensor("linear_14")]; tensor var_273 = const()[name = tensor("op_273"), val = tensor([1, 512, 12, 64])]; tensor x_31 = reshape(shape = var_273, x = x_29)[name = tensor("x_31")]; tensor var_275 = const()[name = tensor("op_275"), val = tensor([0, 2, 1, 3])]; tensor var_279 = const()[name = tensor("op_279"), val = tensor([1, 512, 12, 64])]; tensor x_35 = reshape(shape = var_279, x = x_33)[name = tensor("x_35")]; tensor attention_scores_9_transpose_x_0 = const()[name = tensor("attention_scores_9_transpose_x_0"), val = tensor(false)]; tensor attention_scores_9_transpose_y_0 = const()[name = tensor("attention_scores_9_transpose_y_0"), val = tensor(false)]; tensor transpose_40_perm_0 = const()[name = tensor("transpose_40_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_41_perm_0 = const()[name = tensor("transpose_41_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_41 = transpose(perm = transpose_41_perm_0, x = x_27)[name = tensor("transpose_97")]; tensor transpose_40 = transpose(perm = transpose_40_perm_0, x = x_35)[name = tensor("transpose_98")]; tensor attention_scores_9 = matmul(transpose_x = attention_scores_9_transpose_x_0, transpose_y = attention_scores_9_transpose_y_0, x = transpose_40, y = transpose_41)[name = tensor("attention_scores_9")]; tensor _inversed_attention_scores_11_y_0 = const()[name = tensor("_inversed_attention_scores_11_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_11 = mul(x = attention_scores_9, y = _inversed_attention_scores_11_y_0)[name = tensor("_inversed_attention_scores_11")]; tensor input_55 = add(x = _inversed_attention_scores_11, y = attention_mask_1)[name = tensor("input_55")]; tensor input_57 = softmax(axis = var_10, x = input_55)[name = tensor("input_57")]; tensor context_layer_9_transpose_x_0 = const()[name = tensor("context_layer_9_transpose_x_0"), val = tensor(false)]; tensor context_layer_9_transpose_y_0 = const()[name = tensor("context_layer_9_transpose_y_0"), val = tensor(false)]; tensor value_layer_5 = transpose(perm = var_275, x = x_31)[name = tensor("transpose_99")]; tensor context_layer_9 = matmul(transpose_x = context_layer_9_transpose_x_0, transpose_y = context_layer_9_transpose_y_0, x = input_57, y = value_layer_5)[name = tensor("context_layer_9")]; tensor var_291 = const()[name = tensor("op_291"), val = tensor([0, 2, 1, 3])]; tensor var_296 = const()[name = tensor("op_296"), val = tensor([1, 512, 768])]; tensor var_292 = transpose(perm = var_291, x = context_layer_9)[name = tensor("transpose_96")]; tensor input_59 = reshape(shape = var_296, x = var_292)[name = tensor("input_59")]; tensor input_61 = linear(bias = text_branch_encoder_layer_2_attention_output_dense_bias, weight = text_branch_encoder_layer_2_attention_output_dense_weight, x = input_59)[name = tensor("linear_15")]; tensor input_63 = add(x = input_61, y = input_53)[name = tensor("input_63")]; tensor input_65_axes_0 = const()[name = tensor("input_65_axes_0"), val = tensor([-1])]; tensor input_65 = layer_norm(axes = input_65_axes_0, beta = text_branch_encoder_layer_2_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_2_attention_output_LayerNorm_weight, x = input_63)[name = tensor("input_65")]; tensor input_67 = linear(bias = text_branch_encoder_layer_2_intermediate_dense_bias, weight = text_branch_encoder_layer_2_intermediate_dense_weight, x = input_65)[name = tensor("linear_16")]; tensor input_69_mode_0 = const()[name = tensor("input_69_mode_0"), val = tensor("EXACT")]; tensor input_69 = gelu(mode = input_69_mode_0, x = input_67)[name = tensor("input_69")]; tensor input_71 = linear(bias = text_branch_encoder_layer_2_output_dense_bias, weight = text_branch_encoder_layer_2_output_dense_weight, x = input_69)[name = tensor("linear_17")]; tensor input_73 = add(x = input_71, y = input_65)[name = tensor("input_73")]; tensor input_75_axes_0 = const()[name = tensor("input_75_axes_0"), val = tensor([-1])]; tensor input_75 = layer_norm(axes = input_75_axes_0, beta = text_branch_encoder_layer_2_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_2_output_LayerNorm_weight, x = input_73)[name = tensor("input_75")]; tensor x_45 = linear(bias = text_branch_encoder_layer_3_attention_self_query_bias, weight = text_branch_encoder_layer_3_attention_self_query_weight, x = input_75)[name = tensor("linear_18")]; tensor x_37 = linear(bias = text_branch_encoder_layer_3_attention_self_key_bias, weight = text_branch_encoder_layer_3_attention_self_key_weight, x = input_75)[name = tensor("linear_19")]; tensor var_341 = const()[name = tensor("op_341"), val = tensor([1, 512, 12, 64])]; tensor x_39 = reshape(shape = var_341, x = x_37)[name = tensor("x_39")]; tensor x_41 = linear(bias = text_branch_encoder_layer_3_attention_self_value_bias, weight = text_branch_encoder_layer_3_attention_self_value_weight, x = input_75)[name = tensor("linear_20")]; tensor var_350 = const()[name = tensor("op_350"), val = tensor([1, 512, 12, 64])]; tensor x_43 = reshape(shape = var_350, x = x_41)[name = tensor("x_43")]; tensor var_352 = const()[name = tensor("op_352"), val = tensor([0, 2, 1, 3])]; tensor var_356 = const()[name = tensor("op_356"), val = tensor([1, 512, 12, 64])]; tensor x_47 = reshape(shape = var_356, x = x_45)[name = tensor("x_47")]; tensor attention_scores_13_transpose_x_0 = const()[name = tensor("attention_scores_13_transpose_x_0"), val = tensor(false)]; tensor attention_scores_13_transpose_y_0 = const()[name = tensor("attention_scores_13_transpose_y_0"), val = tensor(false)]; tensor transpose_42_perm_0 = const()[name = tensor("transpose_42_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_43_perm_0 = const()[name = tensor("transpose_43_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_43 = transpose(perm = transpose_43_perm_0, x = x_39)[name = tensor("transpose_93")]; tensor transpose_42 = transpose(perm = transpose_42_perm_0, x = x_47)[name = tensor("transpose_94")]; tensor attention_scores_13 = matmul(transpose_x = attention_scores_13_transpose_x_0, transpose_y = attention_scores_13_transpose_y_0, x = transpose_42, y = transpose_43)[name = tensor("attention_scores_13")]; tensor _inversed_attention_scores_15_y_0 = const()[name = tensor("_inversed_attention_scores_15_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_15 = mul(x = attention_scores_13, y = _inversed_attention_scores_15_y_0)[name = tensor("_inversed_attention_scores_15")]; tensor input_77 = add(x = _inversed_attention_scores_15, y = attention_mask_1)[name = tensor("input_77")]; tensor input_79 = softmax(axis = var_10, x = input_77)[name = tensor("input_79")]; tensor context_layer_13_transpose_x_0 = const()[name = tensor("context_layer_13_transpose_x_0"), val = tensor(false)]; tensor context_layer_13_transpose_y_0 = const()[name = tensor("context_layer_13_transpose_y_0"), val = tensor(false)]; tensor value_layer_7 = transpose(perm = var_352, x = x_43)[name = tensor("transpose_95")]; tensor context_layer_13 = matmul(transpose_x = context_layer_13_transpose_x_0, transpose_y = context_layer_13_transpose_y_0, x = input_79, y = value_layer_7)[name = tensor("context_layer_13")]; tensor var_368 = const()[name = tensor("op_368"), val = tensor([0, 2, 1, 3])]; tensor var_373 = const()[name = tensor("op_373"), val = tensor([1, 512, 768])]; tensor var_369 = transpose(perm = var_368, x = context_layer_13)[name = tensor("transpose_92")]; tensor input_81 = reshape(shape = var_373, x = var_369)[name = tensor("input_81")]; tensor input_83 = linear(bias = text_branch_encoder_layer_3_attention_output_dense_bias, weight = text_branch_encoder_layer_3_attention_output_dense_weight, x = input_81)[name = tensor("linear_21")]; tensor input_85 = add(x = input_83, y = input_75)[name = tensor("input_85")]; tensor input_87_axes_0 = const()[name = tensor("input_87_axes_0"), val = tensor([-1])]; tensor input_87 = layer_norm(axes = input_87_axes_0, beta = text_branch_encoder_layer_3_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_3_attention_output_LayerNorm_weight, x = input_85)[name = tensor("input_87")]; tensor input_89 = linear(bias = text_branch_encoder_layer_3_intermediate_dense_bias, weight = text_branch_encoder_layer_3_intermediate_dense_weight, x = input_87)[name = tensor("linear_22")]; tensor input_91_mode_0 = const()[name = tensor("input_91_mode_0"), val = tensor("EXACT")]; tensor input_91 = gelu(mode = input_91_mode_0, x = input_89)[name = tensor("input_91")]; tensor input_93 = linear(bias = text_branch_encoder_layer_3_output_dense_bias, weight = text_branch_encoder_layer_3_output_dense_weight, x = input_91)[name = tensor("linear_23")]; tensor input_95 = add(x = input_93, y = input_87)[name = tensor("input_95")]; tensor input_97_axes_0 = const()[name = tensor("input_97_axes_0"), val = tensor([-1])]; tensor input_97 = layer_norm(axes = input_97_axes_0, beta = text_branch_encoder_layer_3_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_3_output_LayerNorm_weight, x = input_95)[name = tensor("input_97")]; tensor x_57 = linear(bias = text_branch_encoder_layer_4_attention_self_query_bias, weight = text_branch_encoder_layer_4_attention_self_query_weight, x = input_97)[name = tensor("linear_24")]; tensor x_49 = linear(bias = text_branch_encoder_layer_4_attention_self_key_bias, weight = text_branch_encoder_layer_4_attention_self_key_weight, x = input_97)[name = tensor("linear_25")]; tensor var_418 = const()[name = tensor("op_418"), val = tensor([1, 512, 12, 64])]; tensor x_51 = reshape(shape = var_418, x = x_49)[name = tensor("x_51")]; tensor x_53 = linear(bias = text_branch_encoder_layer_4_attention_self_value_bias, weight = text_branch_encoder_layer_4_attention_self_value_weight, x = input_97)[name = tensor("linear_26")]; tensor var_427 = const()[name = tensor("op_427"), val = tensor([1, 512, 12, 64])]; tensor x_55 = reshape(shape = var_427, x = x_53)[name = tensor("x_55")]; tensor var_429 = const()[name = tensor("op_429"), val = tensor([0, 2, 1, 3])]; tensor var_433 = const()[name = tensor("op_433"), val = tensor([1, 512, 12, 64])]; tensor x_59 = reshape(shape = var_433, x = x_57)[name = tensor("x_59")]; tensor attention_scores_17_transpose_x_0 = const()[name = tensor("attention_scores_17_transpose_x_0"), val = tensor(false)]; tensor attention_scores_17_transpose_y_0 = const()[name = tensor("attention_scores_17_transpose_y_0"), val = tensor(false)]; tensor transpose_44_perm_0 = const()[name = tensor("transpose_44_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_45_perm_0 = const()[name = tensor("transpose_45_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_45 = transpose(perm = transpose_45_perm_0, x = x_51)[name = tensor("transpose_89")]; tensor transpose_44 = transpose(perm = transpose_44_perm_0, x = x_59)[name = tensor("transpose_90")]; tensor attention_scores_17 = matmul(transpose_x = attention_scores_17_transpose_x_0, transpose_y = attention_scores_17_transpose_y_0, x = transpose_44, y = transpose_45)[name = tensor("attention_scores_17")]; tensor _inversed_attention_scores_19_y_0 = const()[name = tensor("_inversed_attention_scores_19_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_19 = mul(x = attention_scores_17, y = _inversed_attention_scores_19_y_0)[name = tensor("_inversed_attention_scores_19")]; tensor input_99 = add(x = _inversed_attention_scores_19, y = attention_mask_1)[name = tensor("input_99")]; tensor input_101 = softmax(axis = var_10, x = input_99)[name = tensor("input_101")]; tensor context_layer_17_transpose_x_0 = const()[name = tensor("context_layer_17_transpose_x_0"), val = tensor(false)]; tensor context_layer_17_transpose_y_0 = const()[name = tensor("context_layer_17_transpose_y_0"), val = tensor(false)]; tensor value_layer_9 = transpose(perm = var_429, x = x_55)[name = tensor("transpose_91")]; tensor context_layer_17 = matmul(transpose_x = context_layer_17_transpose_x_0, transpose_y = context_layer_17_transpose_y_0, x = input_101, y = value_layer_9)[name = tensor("context_layer_17")]; tensor var_445 = const()[name = tensor("op_445"), val = tensor([0, 2, 1, 3])]; tensor var_450 = const()[name = tensor("op_450"), val = tensor([1, 512, 768])]; tensor var_446 = transpose(perm = var_445, x = context_layer_17)[name = tensor("transpose_88")]; tensor input_103 = reshape(shape = var_450, x = var_446)[name = tensor("input_103")]; tensor input_105 = linear(bias = text_branch_encoder_layer_4_attention_output_dense_bias, weight = text_branch_encoder_layer_4_attention_output_dense_weight, x = input_103)[name = tensor("linear_27")]; tensor input_107 = add(x = input_105, y = input_97)[name = tensor("input_107")]; tensor input_109_axes_0 = const()[name = tensor("input_109_axes_0"), val = tensor([-1])]; tensor input_109 = layer_norm(axes = input_109_axes_0, beta = text_branch_encoder_layer_4_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_4_attention_output_LayerNorm_weight, x = input_107)[name = tensor("input_109")]; tensor input_111 = linear(bias = text_branch_encoder_layer_4_intermediate_dense_bias, weight = text_branch_encoder_layer_4_intermediate_dense_weight, x = input_109)[name = tensor("linear_28")]; tensor input_113_mode_0 = const()[name = tensor("input_113_mode_0"), val = tensor("EXACT")]; tensor input_113 = gelu(mode = input_113_mode_0, x = input_111)[name = tensor("input_113")]; tensor input_115 = linear(bias = text_branch_encoder_layer_4_output_dense_bias, weight = text_branch_encoder_layer_4_output_dense_weight, x = input_113)[name = tensor("linear_29")]; tensor input_117 = add(x = input_115, y = input_109)[name = tensor("input_117")]; tensor input_119_axes_0 = const()[name = tensor("input_119_axes_0"), val = tensor([-1])]; tensor input_119 = layer_norm(axes = input_119_axes_0, beta = text_branch_encoder_layer_4_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_4_output_LayerNorm_weight, x = input_117)[name = tensor("input_119")]; tensor x_69 = linear(bias = text_branch_encoder_layer_5_attention_self_query_bias, weight = text_branch_encoder_layer_5_attention_self_query_weight, x = input_119)[name = tensor("linear_30")]; tensor x_61 = linear(bias = text_branch_encoder_layer_5_attention_self_key_bias, weight = text_branch_encoder_layer_5_attention_self_key_weight, x = input_119)[name = tensor("linear_31")]; tensor var_495 = const()[name = tensor("op_495"), val = tensor([1, 512, 12, 64])]; tensor x_63 = reshape(shape = var_495, x = x_61)[name = tensor("x_63")]; tensor x_65 = linear(bias = text_branch_encoder_layer_5_attention_self_value_bias, weight = text_branch_encoder_layer_5_attention_self_value_weight, x = input_119)[name = tensor("linear_32")]; tensor var_504 = const()[name = tensor("op_504"), val = tensor([1, 512, 12, 64])]; tensor x_67 = reshape(shape = var_504, x = x_65)[name = tensor("x_67")]; tensor var_506 = const()[name = tensor("op_506"), val = tensor([0, 2, 1, 3])]; tensor var_510 = const()[name = tensor("op_510"), val = tensor([1, 512, 12, 64])]; tensor x_71 = reshape(shape = var_510, x = x_69)[name = tensor("x_71")]; tensor attention_scores_21_transpose_x_0 = const()[name = tensor("attention_scores_21_transpose_x_0"), val = tensor(false)]; tensor attention_scores_21_transpose_y_0 = const()[name = tensor("attention_scores_21_transpose_y_0"), val = tensor(false)]; tensor transpose_46_perm_0 = const()[name = tensor("transpose_46_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_47_perm_0 = const()[name = tensor("transpose_47_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_47 = transpose(perm = transpose_47_perm_0, x = x_63)[name = tensor("transpose_85")]; tensor transpose_46 = transpose(perm = transpose_46_perm_0, x = x_71)[name = tensor("transpose_86")]; tensor attention_scores_21 = matmul(transpose_x = attention_scores_21_transpose_x_0, transpose_y = attention_scores_21_transpose_y_0, x = transpose_46, y = transpose_47)[name = tensor("attention_scores_21")]; tensor _inversed_attention_scores_23_y_0 = const()[name = tensor("_inversed_attention_scores_23_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_23 = mul(x = attention_scores_21, y = _inversed_attention_scores_23_y_0)[name = tensor("_inversed_attention_scores_23")]; tensor input_121 = add(x = _inversed_attention_scores_23, y = attention_mask_1)[name = tensor("input_121")]; tensor input_123 = softmax(axis = var_10, x = input_121)[name = tensor("input_123")]; tensor context_layer_21_transpose_x_0 = const()[name = tensor("context_layer_21_transpose_x_0"), val = tensor(false)]; tensor context_layer_21_transpose_y_0 = const()[name = tensor("context_layer_21_transpose_y_0"), val = tensor(false)]; tensor value_layer_11 = transpose(perm = var_506, x = x_67)[name = tensor("transpose_87")]; tensor context_layer_21 = matmul(transpose_x = context_layer_21_transpose_x_0, transpose_y = context_layer_21_transpose_y_0, x = input_123, y = value_layer_11)[name = tensor("context_layer_21")]; tensor var_522 = const()[name = tensor("op_522"), val = tensor([0, 2, 1, 3])]; tensor var_527 = const()[name = tensor("op_527"), val = tensor([1, 512, 768])]; tensor var_523 = transpose(perm = var_522, x = context_layer_21)[name = tensor("transpose_84")]; tensor input_125 = reshape(shape = var_527, x = var_523)[name = tensor("input_125")]; tensor input_127 = linear(bias = text_branch_encoder_layer_5_attention_output_dense_bias, weight = text_branch_encoder_layer_5_attention_output_dense_weight, x = input_125)[name = tensor("linear_33")]; tensor input_129 = add(x = input_127, y = input_119)[name = tensor("input_129")]; tensor input_131_axes_0 = const()[name = tensor("input_131_axes_0"), val = tensor([-1])]; tensor input_131 = layer_norm(axes = input_131_axes_0, beta = text_branch_encoder_layer_5_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_5_attention_output_LayerNorm_weight, x = input_129)[name = tensor("input_131")]; tensor input_133 = linear(bias = text_branch_encoder_layer_5_intermediate_dense_bias, weight = text_branch_encoder_layer_5_intermediate_dense_weight, x = input_131)[name = tensor("linear_34")]; tensor input_135_mode_0 = const()[name = tensor("input_135_mode_0"), val = tensor("EXACT")]; tensor input_135 = gelu(mode = input_135_mode_0, x = input_133)[name = tensor("input_135")]; tensor input_137 = linear(bias = text_branch_encoder_layer_5_output_dense_bias, weight = text_branch_encoder_layer_5_output_dense_weight, x = input_135)[name = tensor("linear_35")]; tensor input_139 = add(x = input_137, y = input_131)[name = tensor("input_139")]; tensor input_141_axes_0 = const()[name = tensor("input_141_axes_0"), val = tensor([-1])]; tensor input_141 = layer_norm(axes = input_141_axes_0, beta = text_branch_encoder_layer_5_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_5_output_LayerNorm_weight, x = input_139)[name = tensor("input_141")]; tensor x_81 = linear(bias = text_branch_encoder_layer_6_attention_self_query_bias, weight = text_branch_encoder_layer_6_attention_self_query_weight, x = input_141)[name = tensor("linear_36")]; tensor x_73 = linear(bias = text_branch_encoder_layer_6_attention_self_key_bias, weight = text_branch_encoder_layer_6_attention_self_key_weight, x = input_141)[name = tensor("linear_37")]; tensor var_572 = const()[name = tensor("op_572"), val = tensor([1, 512, 12, 64])]; tensor x_75 = reshape(shape = var_572, x = x_73)[name = tensor("x_75")]; tensor x_77 = linear(bias = text_branch_encoder_layer_6_attention_self_value_bias, weight = text_branch_encoder_layer_6_attention_self_value_weight, x = input_141)[name = tensor("linear_38")]; tensor var_581 = const()[name = tensor("op_581"), val = tensor([1, 512, 12, 64])]; tensor x_79 = reshape(shape = var_581, x = x_77)[name = tensor("x_79")]; tensor var_583 = const()[name = tensor("op_583"), val = tensor([0, 2, 1, 3])]; tensor var_587 = const()[name = tensor("op_587"), val = tensor([1, 512, 12, 64])]; tensor x_83 = reshape(shape = var_587, x = x_81)[name = tensor("x_83")]; tensor attention_scores_25_transpose_x_0 = const()[name = tensor("attention_scores_25_transpose_x_0"), val = tensor(false)]; tensor attention_scores_25_transpose_y_0 = const()[name = tensor("attention_scores_25_transpose_y_0"), val = tensor(false)]; tensor transpose_48_perm_0 = const()[name = tensor("transpose_48_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_49_perm_0 = const()[name = tensor("transpose_49_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_49 = transpose(perm = transpose_49_perm_0, x = x_75)[name = tensor("transpose_81")]; tensor transpose_48 = transpose(perm = transpose_48_perm_0, x = x_83)[name = tensor("transpose_82")]; tensor attention_scores_25 = matmul(transpose_x = attention_scores_25_transpose_x_0, transpose_y = attention_scores_25_transpose_y_0, x = transpose_48, y = transpose_49)[name = tensor("attention_scores_25")]; tensor _inversed_attention_scores_27_y_0 = const()[name = tensor("_inversed_attention_scores_27_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_27 = mul(x = attention_scores_25, y = _inversed_attention_scores_27_y_0)[name = tensor("_inversed_attention_scores_27")]; tensor input_143 = add(x = _inversed_attention_scores_27, y = attention_mask_1)[name = tensor("input_143")]; tensor input_145 = softmax(axis = var_10, x = input_143)[name = tensor("input_145")]; tensor context_layer_25_transpose_x_0 = const()[name = tensor("context_layer_25_transpose_x_0"), val = tensor(false)]; tensor context_layer_25_transpose_y_0 = const()[name = tensor("context_layer_25_transpose_y_0"), val = tensor(false)]; tensor value_layer_13 = transpose(perm = var_583, x = x_79)[name = tensor("transpose_83")]; tensor context_layer_25 = matmul(transpose_x = context_layer_25_transpose_x_0, transpose_y = context_layer_25_transpose_y_0, x = input_145, y = value_layer_13)[name = tensor("context_layer_25")]; tensor var_599 = const()[name = tensor("op_599"), val = tensor([0, 2, 1, 3])]; tensor var_604 = const()[name = tensor("op_604"), val = tensor([1, 512, 768])]; tensor var_600 = transpose(perm = var_599, x = context_layer_25)[name = tensor("transpose_80")]; tensor input_147 = reshape(shape = var_604, x = var_600)[name = tensor("input_147")]; tensor input_149 = linear(bias = text_branch_encoder_layer_6_attention_output_dense_bias, weight = text_branch_encoder_layer_6_attention_output_dense_weight, x = input_147)[name = tensor("linear_39")]; tensor input_151 = add(x = input_149, y = input_141)[name = tensor("input_151")]; tensor input_153_axes_0 = const()[name = tensor("input_153_axes_0"), val = tensor([-1])]; tensor input_153 = layer_norm(axes = input_153_axes_0, beta = text_branch_encoder_layer_6_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_6_attention_output_LayerNorm_weight, x = input_151)[name = tensor("input_153")]; tensor input_155 = linear(bias = text_branch_encoder_layer_6_intermediate_dense_bias, weight = text_branch_encoder_layer_6_intermediate_dense_weight, x = input_153)[name = tensor("linear_40")]; tensor input_157_mode_0 = const()[name = tensor("input_157_mode_0"), val = tensor("EXACT")]; tensor input_157 = gelu(mode = input_157_mode_0, x = input_155)[name = tensor("input_157")]; tensor input_159 = linear(bias = text_branch_encoder_layer_6_output_dense_bias, weight = text_branch_encoder_layer_6_output_dense_weight, x = input_157)[name = tensor("linear_41")]; tensor input_161 = add(x = input_159, y = input_153)[name = tensor("input_161")]; tensor input_163_axes_0 = const()[name = tensor("input_163_axes_0"), val = tensor([-1])]; tensor input_163 = layer_norm(axes = input_163_axes_0, beta = text_branch_encoder_layer_6_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_6_output_LayerNorm_weight, x = input_161)[name = tensor("input_163")]; tensor x_93 = linear(bias = text_branch_encoder_layer_7_attention_self_query_bias, weight = text_branch_encoder_layer_7_attention_self_query_weight, x = input_163)[name = tensor("linear_42")]; tensor x_85 = linear(bias = text_branch_encoder_layer_7_attention_self_key_bias, weight = text_branch_encoder_layer_7_attention_self_key_weight, x = input_163)[name = tensor("linear_43")]; tensor var_649 = const()[name = tensor("op_649"), val = tensor([1, 512, 12, 64])]; tensor x_87 = reshape(shape = var_649, x = x_85)[name = tensor("x_87")]; tensor x_89 = linear(bias = text_branch_encoder_layer_7_attention_self_value_bias, weight = text_branch_encoder_layer_7_attention_self_value_weight, x = input_163)[name = tensor("linear_44")]; tensor var_658 = const()[name = tensor("op_658"), val = tensor([1, 512, 12, 64])]; tensor x_91 = reshape(shape = var_658, x = x_89)[name = tensor("x_91")]; tensor var_660 = const()[name = tensor("op_660"), val = tensor([0, 2, 1, 3])]; tensor var_664 = const()[name = tensor("op_664"), val = tensor([1, 512, 12, 64])]; tensor x_95 = reshape(shape = var_664, x = x_93)[name = tensor("x_95")]; tensor attention_scores_29_transpose_x_0 = const()[name = tensor("attention_scores_29_transpose_x_0"), val = tensor(false)]; tensor attention_scores_29_transpose_y_0 = const()[name = tensor("attention_scores_29_transpose_y_0"), val = tensor(false)]; tensor transpose_50_perm_0 = const()[name = tensor("transpose_50_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_51_perm_0 = const()[name = tensor("transpose_51_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_51 = transpose(perm = transpose_51_perm_0, x = x_87)[name = tensor("transpose_77")]; tensor transpose_50 = transpose(perm = transpose_50_perm_0, x = x_95)[name = tensor("transpose_78")]; tensor attention_scores_29 = matmul(transpose_x = attention_scores_29_transpose_x_0, transpose_y = attention_scores_29_transpose_y_0, x = transpose_50, y = transpose_51)[name = tensor("attention_scores_29")]; tensor _inversed_attention_scores_31_y_0 = const()[name = tensor("_inversed_attention_scores_31_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_31 = mul(x = attention_scores_29, y = _inversed_attention_scores_31_y_0)[name = tensor("_inversed_attention_scores_31")]; tensor input_165 = add(x = _inversed_attention_scores_31, y = attention_mask_1)[name = tensor("input_165")]; tensor input_167 = softmax(axis = var_10, x = input_165)[name = tensor("input_167")]; tensor context_layer_29_transpose_x_0 = const()[name = tensor("context_layer_29_transpose_x_0"), val = tensor(false)]; tensor context_layer_29_transpose_y_0 = const()[name = tensor("context_layer_29_transpose_y_0"), val = tensor(false)]; tensor value_layer_15 = transpose(perm = var_660, x = x_91)[name = tensor("transpose_79")]; tensor context_layer_29 = matmul(transpose_x = context_layer_29_transpose_x_0, transpose_y = context_layer_29_transpose_y_0, x = input_167, y = value_layer_15)[name = tensor("context_layer_29")]; tensor var_676 = const()[name = tensor("op_676"), val = tensor([0, 2, 1, 3])]; tensor var_681 = const()[name = tensor("op_681"), val = tensor([1, 512, 768])]; tensor var_677 = transpose(perm = var_676, x = context_layer_29)[name = tensor("transpose_76")]; tensor input_169 = reshape(shape = var_681, x = var_677)[name = tensor("input_169")]; tensor input_171 = linear(bias = text_branch_encoder_layer_7_attention_output_dense_bias, weight = text_branch_encoder_layer_7_attention_output_dense_weight, x = input_169)[name = tensor("linear_45")]; tensor input_173 = add(x = input_171, y = input_163)[name = tensor("input_173")]; tensor input_175_axes_0 = const()[name = tensor("input_175_axes_0"), val = tensor([-1])]; tensor input_175 = layer_norm(axes = input_175_axes_0, beta = text_branch_encoder_layer_7_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_7_attention_output_LayerNorm_weight, x = input_173)[name = tensor("input_175")]; tensor input_177 = linear(bias = text_branch_encoder_layer_7_intermediate_dense_bias, weight = text_branch_encoder_layer_7_intermediate_dense_weight, x = input_175)[name = tensor("linear_46")]; tensor input_179_mode_0 = const()[name = tensor("input_179_mode_0"), val = tensor("EXACT")]; tensor input_179 = gelu(mode = input_179_mode_0, x = input_177)[name = tensor("input_179")]; tensor input_181 = linear(bias = text_branch_encoder_layer_7_output_dense_bias, weight = text_branch_encoder_layer_7_output_dense_weight, x = input_179)[name = tensor("linear_47")]; tensor input_183 = add(x = input_181, y = input_175)[name = tensor("input_183")]; tensor input_185_axes_0 = const()[name = tensor("input_185_axes_0"), val = tensor([-1])]; tensor input_185 = layer_norm(axes = input_185_axes_0, beta = text_branch_encoder_layer_7_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_7_output_LayerNorm_weight, x = input_183)[name = tensor("input_185")]; tensor x_105 = linear(bias = text_branch_encoder_layer_8_attention_self_query_bias, weight = text_branch_encoder_layer_8_attention_self_query_weight, x = input_185)[name = tensor("linear_48")]; tensor x_97 = linear(bias = text_branch_encoder_layer_8_attention_self_key_bias, weight = text_branch_encoder_layer_8_attention_self_key_weight, x = input_185)[name = tensor("linear_49")]; tensor var_726 = const()[name = tensor("op_726"), val = tensor([1, 512, 12, 64])]; tensor x_99 = reshape(shape = var_726, x = x_97)[name = tensor("x_99")]; tensor x_101 = linear(bias = text_branch_encoder_layer_8_attention_self_value_bias, weight = text_branch_encoder_layer_8_attention_self_value_weight, x = input_185)[name = tensor("linear_50")]; tensor var_735 = const()[name = tensor("op_735"), val = tensor([1, 512, 12, 64])]; tensor x_103 = reshape(shape = var_735, x = x_101)[name = tensor("x_103")]; tensor var_737 = const()[name = tensor("op_737"), val = tensor([0, 2, 1, 3])]; tensor var_741 = const()[name = tensor("op_741"), val = tensor([1, 512, 12, 64])]; tensor x_107 = reshape(shape = var_741, x = x_105)[name = tensor("x_107")]; tensor attention_scores_33_transpose_x_0 = const()[name = tensor("attention_scores_33_transpose_x_0"), val = tensor(false)]; tensor attention_scores_33_transpose_y_0 = const()[name = tensor("attention_scores_33_transpose_y_0"), val = tensor(false)]; tensor transpose_52_perm_0 = const()[name = tensor("transpose_52_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_53_perm_0 = const()[name = tensor("transpose_53_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_53 = transpose(perm = transpose_53_perm_0, x = x_99)[name = tensor("transpose_73")]; tensor transpose_52 = transpose(perm = transpose_52_perm_0, x = x_107)[name = tensor("transpose_74")]; tensor attention_scores_33 = matmul(transpose_x = attention_scores_33_transpose_x_0, transpose_y = attention_scores_33_transpose_y_0, x = transpose_52, y = transpose_53)[name = tensor("attention_scores_33")]; tensor _inversed_attention_scores_35_y_0 = const()[name = tensor("_inversed_attention_scores_35_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_35 = mul(x = attention_scores_33, y = _inversed_attention_scores_35_y_0)[name = tensor("_inversed_attention_scores_35")]; tensor input_187 = add(x = _inversed_attention_scores_35, y = attention_mask_1)[name = tensor("input_187")]; tensor input_189 = softmax(axis = var_10, x = input_187)[name = tensor("input_189")]; tensor context_layer_33_transpose_x_0 = const()[name = tensor("context_layer_33_transpose_x_0"), val = tensor(false)]; tensor context_layer_33_transpose_y_0 = const()[name = tensor("context_layer_33_transpose_y_0"), val = tensor(false)]; tensor value_layer_17 = transpose(perm = var_737, x = x_103)[name = tensor("transpose_75")]; tensor context_layer_33 = matmul(transpose_x = context_layer_33_transpose_x_0, transpose_y = context_layer_33_transpose_y_0, x = input_189, y = value_layer_17)[name = tensor("context_layer_33")]; tensor var_753 = const()[name = tensor("op_753"), val = tensor([0, 2, 1, 3])]; tensor var_758 = const()[name = tensor("op_758"), val = tensor([1, 512, 768])]; tensor var_754 = transpose(perm = var_753, x = context_layer_33)[name = tensor("transpose_72")]; tensor input_191 = reshape(shape = var_758, x = var_754)[name = tensor("input_191")]; tensor input_193 = linear(bias = text_branch_encoder_layer_8_attention_output_dense_bias, weight = text_branch_encoder_layer_8_attention_output_dense_weight, x = input_191)[name = tensor("linear_51")]; tensor input_195 = add(x = input_193, y = input_185)[name = tensor("input_195")]; tensor input_197_axes_0 = const()[name = tensor("input_197_axes_0"), val = tensor([-1])]; tensor input_197 = layer_norm(axes = input_197_axes_0, beta = text_branch_encoder_layer_8_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_8_attention_output_LayerNorm_weight, x = input_195)[name = tensor("input_197")]; tensor input_199 = linear(bias = text_branch_encoder_layer_8_intermediate_dense_bias, weight = text_branch_encoder_layer_8_intermediate_dense_weight, x = input_197)[name = tensor("linear_52")]; tensor input_201_mode_0 = const()[name = tensor("input_201_mode_0"), val = tensor("EXACT")]; tensor input_201 = gelu(mode = input_201_mode_0, x = input_199)[name = tensor("input_201")]; tensor input_203 = linear(bias = text_branch_encoder_layer_8_output_dense_bias, weight = text_branch_encoder_layer_8_output_dense_weight, x = input_201)[name = tensor("linear_53")]; tensor input_205 = add(x = input_203, y = input_197)[name = tensor("input_205")]; tensor input_207_axes_0 = const()[name = tensor("input_207_axes_0"), val = tensor([-1])]; tensor input_207 = layer_norm(axes = input_207_axes_0, beta = text_branch_encoder_layer_8_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_8_output_LayerNorm_weight, x = input_205)[name = tensor("input_207")]; tensor x_117 = linear(bias = text_branch_encoder_layer_9_attention_self_query_bias, weight = text_branch_encoder_layer_9_attention_self_query_weight, x = input_207)[name = tensor("linear_54")]; tensor x_109 = linear(bias = text_branch_encoder_layer_9_attention_self_key_bias, weight = text_branch_encoder_layer_9_attention_self_key_weight, x = input_207)[name = tensor("linear_55")]; tensor var_803 = const()[name = tensor("op_803"), val = tensor([1, 512, 12, 64])]; tensor x_111 = reshape(shape = var_803, x = x_109)[name = tensor("x_111")]; tensor x_113 = linear(bias = text_branch_encoder_layer_9_attention_self_value_bias, weight = text_branch_encoder_layer_9_attention_self_value_weight, x = input_207)[name = tensor("linear_56")]; tensor var_812 = const()[name = tensor("op_812"), val = tensor([1, 512, 12, 64])]; tensor x_115 = reshape(shape = var_812, x = x_113)[name = tensor("x_115")]; tensor var_814 = const()[name = tensor("op_814"), val = tensor([0, 2, 1, 3])]; tensor var_818 = const()[name = tensor("op_818"), val = tensor([1, 512, 12, 64])]; tensor x_119 = reshape(shape = var_818, x = x_117)[name = tensor("x_119")]; tensor attention_scores_37_transpose_x_0 = const()[name = tensor("attention_scores_37_transpose_x_0"), val = tensor(false)]; tensor attention_scores_37_transpose_y_0 = const()[name = tensor("attention_scores_37_transpose_y_0"), val = tensor(false)]; tensor transpose_54_perm_0 = const()[name = tensor("transpose_54_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_55_perm_0 = const()[name = tensor("transpose_55_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_55 = transpose(perm = transpose_55_perm_0, x = x_111)[name = tensor("transpose_69")]; tensor transpose_54 = transpose(perm = transpose_54_perm_0, x = x_119)[name = tensor("transpose_70")]; tensor attention_scores_37 = matmul(transpose_x = attention_scores_37_transpose_x_0, transpose_y = attention_scores_37_transpose_y_0, x = transpose_54, y = transpose_55)[name = tensor("attention_scores_37")]; tensor _inversed_attention_scores_39_y_0 = const()[name = tensor("_inversed_attention_scores_39_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_39 = mul(x = attention_scores_37, y = _inversed_attention_scores_39_y_0)[name = tensor("_inversed_attention_scores_39")]; tensor input_209 = add(x = _inversed_attention_scores_39, y = attention_mask_1)[name = tensor("input_209")]; tensor input_211 = softmax(axis = var_10, x = input_209)[name = tensor("input_211")]; tensor context_layer_37_transpose_x_0 = const()[name = tensor("context_layer_37_transpose_x_0"), val = tensor(false)]; tensor context_layer_37_transpose_y_0 = const()[name = tensor("context_layer_37_transpose_y_0"), val = tensor(false)]; tensor value_layer_19 = transpose(perm = var_814, x = x_115)[name = tensor("transpose_71")]; tensor context_layer_37 = matmul(transpose_x = context_layer_37_transpose_x_0, transpose_y = context_layer_37_transpose_y_0, x = input_211, y = value_layer_19)[name = tensor("context_layer_37")]; tensor var_830 = const()[name = tensor("op_830"), val = tensor([0, 2, 1, 3])]; tensor var_835 = const()[name = tensor("op_835"), val = tensor([1, 512, 768])]; tensor var_831 = transpose(perm = var_830, x = context_layer_37)[name = tensor("transpose_68")]; tensor input_213 = reshape(shape = var_835, x = var_831)[name = tensor("input_213")]; tensor input_215 = linear(bias = text_branch_encoder_layer_9_attention_output_dense_bias, weight = text_branch_encoder_layer_9_attention_output_dense_weight, x = input_213)[name = tensor("linear_57")]; tensor input_217 = add(x = input_215, y = input_207)[name = tensor("input_217")]; tensor input_219_axes_0 = const()[name = tensor("input_219_axes_0"), val = tensor([-1])]; tensor input_219 = layer_norm(axes = input_219_axes_0, beta = text_branch_encoder_layer_9_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_9_attention_output_LayerNorm_weight, x = input_217)[name = tensor("input_219")]; tensor input_221 = linear(bias = text_branch_encoder_layer_9_intermediate_dense_bias, weight = text_branch_encoder_layer_9_intermediate_dense_weight, x = input_219)[name = tensor("linear_58")]; tensor input_223_mode_0 = const()[name = tensor("input_223_mode_0"), val = tensor("EXACT")]; tensor input_223 = gelu(mode = input_223_mode_0, x = input_221)[name = tensor("input_223")]; tensor input_225 = linear(bias = text_branch_encoder_layer_9_output_dense_bias, weight = text_branch_encoder_layer_9_output_dense_weight, x = input_223)[name = tensor("linear_59")]; tensor input_227 = add(x = input_225, y = input_219)[name = tensor("input_227")]; tensor input_229_axes_0 = const()[name = tensor("input_229_axes_0"), val = tensor([-1])]; tensor input_229 = layer_norm(axes = input_229_axes_0, beta = text_branch_encoder_layer_9_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_9_output_LayerNorm_weight, x = input_227)[name = tensor("input_229")]; tensor x_129 = linear(bias = text_branch_encoder_layer_10_attention_self_query_bias, weight = text_branch_encoder_layer_10_attention_self_query_weight, x = input_229)[name = tensor("linear_60")]; tensor x_121 = linear(bias = text_branch_encoder_layer_10_attention_self_key_bias, weight = text_branch_encoder_layer_10_attention_self_key_weight, x = input_229)[name = tensor("linear_61")]; tensor var_880 = const()[name = tensor("op_880"), val = tensor([1, 512, 12, 64])]; tensor x_123 = reshape(shape = var_880, x = x_121)[name = tensor("x_123")]; tensor x_125 = linear(bias = text_branch_encoder_layer_10_attention_self_value_bias, weight = text_branch_encoder_layer_10_attention_self_value_weight, x = input_229)[name = tensor("linear_62")]; tensor var_889 = const()[name = tensor("op_889"), val = tensor([1, 512, 12, 64])]; tensor x_127 = reshape(shape = var_889, x = x_125)[name = tensor("x_127")]; tensor var_891 = const()[name = tensor("op_891"), val = tensor([0, 2, 1, 3])]; tensor var_895 = const()[name = tensor("op_895"), val = tensor([1, 512, 12, 64])]; tensor x_131 = reshape(shape = var_895, x = x_129)[name = tensor("x_131")]; tensor attention_scores_41_transpose_x_0 = const()[name = tensor("attention_scores_41_transpose_x_0"), val = tensor(false)]; tensor attention_scores_41_transpose_y_0 = const()[name = tensor("attention_scores_41_transpose_y_0"), val = tensor(false)]; tensor transpose_56_perm_0 = const()[name = tensor("transpose_56_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_57_perm_0 = const()[name = tensor("transpose_57_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_57 = transpose(perm = transpose_57_perm_0, x = x_123)[name = tensor("transpose_65")]; tensor transpose_56 = transpose(perm = transpose_56_perm_0, x = x_131)[name = tensor("transpose_66")]; tensor attention_scores_41 = matmul(transpose_x = attention_scores_41_transpose_x_0, transpose_y = attention_scores_41_transpose_y_0, x = transpose_56, y = transpose_57)[name = tensor("attention_scores_41")]; tensor _inversed_attention_scores_43_y_0 = const()[name = tensor("_inversed_attention_scores_43_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores_43 = mul(x = attention_scores_41, y = _inversed_attention_scores_43_y_0)[name = tensor("_inversed_attention_scores_43")]; tensor input_231 = add(x = _inversed_attention_scores_43, y = attention_mask_1)[name = tensor("input_231")]; tensor input_233 = softmax(axis = var_10, x = input_231)[name = tensor("input_233")]; tensor context_layer_41_transpose_x_0 = const()[name = tensor("context_layer_41_transpose_x_0"), val = tensor(false)]; tensor context_layer_41_transpose_y_0 = const()[name = tensor("context_layer_41_transpose_y_0"), val = tensor(false)]; tensor value_layer_21 = transpose(perm = var_891, x = x_127)[name = tensor("transpose_67")]; tensor context_layer_41 = matmul(transpose_x = context_layer_41_transpose_x_0, transpose_y = context_layer_41_transpose_y_0, x = input_233, y = value_layer_21)[name = tensor("context_layer_41")]; tensor var_907 = const()[name = tensor("op_907"), val = tensor([0, 2, 1, 3])]; tensor var_912 = const()[name = tensor("op_912"), val = tensor([1, 512, 768])]; tensor var_908 = transpose(perm = var_907, x = context_layer_41)[name = tensor("transpose_64")]; tensor input_235 = reshape(shape = var_912, x = var_908)[name = tensor("input_235")]; tensor input_237 = linear(bias = text_branch_encoder_layer_10_attention_output_dense_bias, weight = text_branch_encoder_layer_10_attention_output_dense_weight, x = input_235)[name = tensor("linear_63")]; tensor input_239 = add(x = input_237, y = input_229)[name = tensor("input_239")]; tensor input_241_axes_0 = const()[name = tensor("input_241_axes_0"), val = tensor([-1])]; tensor input_241 = layer_norm(axes = input_241_axes_0, beta = text_branch_encoder_layer_10_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_10_attention_output_LayerNorm_weight, x = input_239)[name = tensor("input_241")]; tensor input_243 = linear(bias = text_branch_encoder_layer_10_intermediate_dense_bias, weight = text_branch_encoder_layer_10_intermediate_dense_weight, x = input_241)[name = tensor("linear_64")]; tensor input_245_mode_0 = const()[name = tensor("input_245_mode_0"), val = tensor("EXACT")]; tensor input_245 = gelu(mode = input_245_mode_0, x = input_243)[name = tensor("input_245")]; tensor input_247 = linear(bias = text_branch_encoder_layer_10_output_dense_bias, weight = text_branch_encoder_layer_10_output_dense_weight, x = input_245)[name = tensor("linear_65")]; tensor input_249 = add(x = input_247, y = input_241)[name = tensor("input_249")]; tensor input_251_axes_0 = const()[name = tensor("input_251_axes_0"), val = tensor([-1])]; tensor input_251 = layer_norm(axes = input_251_axes_0, beta = text_branch_encoder_layer_10_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_10_output_LayerNorm_weight, x = input_249)[name = tensor("input_251")]; tensor x_141 = linear(bias = text_branch_encoder_layer_11_attention_self_query_bias, weight = text_branch_encoder_layer_11_attention_self_query_weight, x = input_251)[name = tensor("linear_66")]; tensor x_133 = linear(bias = text_branch_encoder_layer_11_attention_self_key_bias, weight = text_branch_encoder_layer_11_attention_self_key_weight, x = input_251)[name = tensor("linear_67")]; tensor var_957 = const()[name = tensor("op_957"), val = tensor([1, 512, 12, 64])]; tensor x_135 = reshape(shape = var_957, x = x_133)[name = tensor("x_135")]; tensor x_137 = linear(bias = text_branch_encoder_layer_11_attention_self_value_bias, weight = text_branch_encoder_layer_11_attention_self_value_weight, x = input_251)[name = tensor("linear_68")]; tensor var_966 = const()[name = tensor("op_966"), val = tensor([1, 512, 12, 64])]; tensor x_139 = reshape(shape = var_966, x = x_137)[name = tensor("x_139")]; tensor var_968 = const()[name = tensor("op_968"), val = tensor([0, 2, 1, 3])]; tensor var_972 = const()[name = tensor("op_972"), val = tensor([1, 512, 12, 64])]; tensor x = reshape(shape = var_972, x = x_141)[name = tensor("x")]; tensor attention_scores_45_transpose_x_0 = const()[name = tensor("attention_scores_45_transpose_x_0"), val = tensor(false)]; tensor attention_scores_45_transpose_y_0 = const()[name = tensor("attention_scores_45_transpose_y_0"), val = tensor(false)]; tensor transpose_58_perm_0 = const()[name = tensor("transpose_58_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_59_perm_0 = const()[name = tensor("transpose_59_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_59 = transpose(perm = transpose_59_perm_0, x = x_135)[name = tensor("transpose_61")]; tensor transpose_58 = transpose(perm = transpose_58_perm_0, x = x)[name = tensor("transpose_62")]; tensor attention_scores_45 = matmul(transpose_x = attention_scores_45_transpose_x_0, transpose_y = attention_scores_45_transpose_y_0, x = transpose_58, y = transpose_59)[name = tensor("attention_scores_45")]; tensor _inversed_attention_scores_y_0 = const()[name = tensor("_inversed_attention_scores_y_0"), val = tensor(0x1p-3)]; tensor _inversed_attention_scores = mul(x = attention_scores_45, y = _inversed_attention_scores_y_0)[name = tensor("_inversed_attention_scores")]; tensor input_253 = add(x = _inversed_attention_scores, y = attention_mask_1)[name = tensor("input_253")]; tensor input_255 = softmax(axis = var_10, x = input_253)[name = tensor("input_255")]; tensor context_layer_45_transpose_x_0 = const()[name = tensor("context_layer_45_transpose_x_0"), val = tensor(false)]; tensor context_layer_45_transpose_y_0 = const()[name = tensor("context_layer_45_transpose_y_0"), val = tensor(false)]; tensor value_layer = transpose(perm = var_968, x = x_139)[name = tensor("transpose_63")]; tensor context_layer_45 = matmul(transpose_x = context_layer_45_transpose_x_0, transpose_y = context_layer_45_transpose_y_0, x = input_255, y = value_layer)[name = tensor("context_layer_45")]; tensor var_984 = const()[name = tensor("op_984"), val = tensor([0, 2, 1, 3])]; tensor var_989 = const()[name = tensor("op_989"), val = tensor([1, 512, 768])]; tensor var_985 = transpose(perm = var_984, x = context_layer_45)[name = tensor("transpose_60")]; tensor input_257 = reshape(shape = var_989, x = var_985)[name = tensor("input_257")]; tensor input_259 = linear(bias = text_branch_encoder_layer_11_attention_output_dense_bias, weight = text_branch_encoder_layer_11_attention_output_dense_weight, x = input_257)[name = tensor("linear_69")]; tensor input_261 = add(x = input_259, y = input_251)[name = tensor("input_261")]; tensor input_263_axes_0 = const()[name = tensor("input_263_axes_0"), val = tensor([-1])]; tensor input_263 = layer_norm(axes = input_263_axes_0, beta = text_branch_encoder_layer_11_attention_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_11_attention_output_LayerNorm_weight, x = input_261)[name = tensor("input_263")]; tensor input_265 = linear(bias = text_branch_encoder_layer_11_intermediate_dense_bias, weight = text_branch_encoder_layer_11_intermediate_dense_weight, x = input_263)[name = tensor("linear_70")]; tensor input_267_mode_0 = const()[name = tensor("input_267_mode_0"), val = tensor("EXACT")]; tensor input_267 = gelu(mode = input_267_mode_0, x = input_265)[name = tensor("input_267")]; tensor input_269 = linear(bias = text_branch_encoder_layer_11_output_dense_bias, weight = text_branch_encoder_layer_11_output_dense_weight, x = input_267)[name = tensor("linear_71")]; tensor input_271 = add(x = input_269, y = input_263)[name = tensor("input_271")]; tensor hidden_states_axes_0 = const()[name = tensor("hidden_states_axes_0"), val = tensor([-1])]; tensor hidden_states = layer_norm(axes = hidden_states_axes_0, beta = text_branch_encoder_layer_11_output_LayerNorm_bias, epsilon = var_12, gamma = text_branch_encoder_layer_11_output_LayerNorm_weight, x = input_271)[name = tensor("hidden_states")]; tensor input_273_begin_0 = const()[name = tensor("input_273_begin_0"), val = tensor([0, 0, 0])]; tensor input_273_end_0 = const()[name = tensor("input_273_end_0"), val = tensor([1, 1, 768])]; tensor input_273_end_mask_0 = const()[name = tensor("input_273_end_mask_0"), val = tensor([true, false, true])]; tensor input_273_squeeze_mask_0 = const()[name = tensor("input_273_squeeze_mask_0"), val = tensor([false, true, false])]; tensor input_273 = slice_by_index(begin = input_273_begin_0, end = input_273_end_0, end_mask = input_273_end_mask_0, squeeze_mask = input_273_squeeze_mask_0, x = hidden_states)[name = tensor("input_273")]; tensor input_275 = linear(bias = text_branch_pooler_dense_bias, weight = text_branch_pooler_dense_weight, x = input_273)[name = tensor("linear_72")]; tensor input_277 = tanh(x = input_275)[name = tensor("input_277")]; tensor input_279 = linear(bias = text_projection_0_bias, weight = text_projection_0_weight, x = input_277)[name = tensor("linear_73")]; tensor input_281 = relu(x = input_279)[name = tensor("input_281")]; tensor input = linear(bias = text_projection_2_bias, weight = text_projection_2_weight, x = input_281)[name = tensor("linear_74")]; tensor var_1036 = const()[name = tensor("op_1036"), val = tensor([-1])]; tensor var_1037 = const()[name = tensor("op_1037"), val = tensor(true)]; tensor var_1039 = reduce_l2_norm(axes = var_1036, keep_dims = var_1037, x = input)[name = tensor("op_1039")]; tensor var_1040 = const()[name = tensor("op_1040"), val = tensor(0x1.197998p-40)]; tensor var_1041 = maximum(x = var_1039, y = var_1040)[name = tensor("op_1041")]; tensor denom_reps_0 = const()[name = tensor("denom_reps_0"), val = tensor([1, 512])]; tensor denom = tile(reps = denom_reps_0, x = var_1041)[name = tensor("denom")]; tensor text_embedding = real_div(x = input, y = denom)[name = tensor("op_1043")]; } -> (text_embedding); }