diff --git "a/graphs/text_encoder.json" "b/graphs/text_encoder.json" new file mode 100644--- /dev/null +++ "b/graphs/text_encoder.json" @@ -0,0 +1,16427 @@ +{ + "ir_version": 9, + "opsets": [ + { + "domain": "", + "version": 19 + } + ], + "inputs": [ + "text_ids", + "style_ttl", + "text_mask" + ], + "outputs": [ + "text_emb" + ], + "weight_map": { + "tts.ttl.text_encoder.text_embedder.char_embedder.weight": "w000000", + "tts.ttl.text_encoder.convnext.convnext.0.gamma": "w000001", + "tts.ttl.text_encoder.convnext.convnext.0.dwconv.weight": "w000002", + "tts.ttl.text_encoder.convnext.convnext.0.dwconv.bias": "w000003", + "tts.ttl.text_encoder.convnext.convnext.0.norm.norm.weight": "w000004", + "tts.ttl.text_encoder.convnext.convnext.0.norm.norm.bias": "w000005", + "tts.ttl.text_encoder.convnext.convnext.0.pwconv1.weight": "w000006", + "tts.ttl.text_encoder.convnext.convnext.0.pwconv1.bias": "w000007", + "tts.ttl.text_encoder.convnext.convnext.0.pwconv2.weight": "w000008", + "tts.ttl.text_encoder.convnext.convnext.0.pwconv2.bias": "w000009", + "tts.ttl.text_encoder.convnext.convnext.1.gamma": "w000010", + "tts.ttl.text_encoder.convnext.convnext.1.dwconv.weight": "w000011", + "tts.ttl.text_encoder.convnext.convnext.1.dwconv.bias": "w000012", + "tts.ttl.text_encoder.convnext.convnext.1.norm.norm.weight": "w000013", + "tts.ttl.text_encoder.convnext.convnext.1.norm.norm.bias": "w000014", + "tts.ttl.text_encoder.convnext.convnext.1.pwconv1.weight": "w000015", + "tts.ttl.text_encoder.convnext.convnext.1.pwconv1.bias": "w000016", + "tts.ttl.text_encoder.convnext.convnext.1.pwconv2.weight": "w000017", + "tts.ttl.text_encoder.convnext.convnext.1.pwconv2.bias": "w000018", + "tts.ttl.text_encoder.convnext.convnext.2.gamma": "w000019", + "tts.ttl.text_encoder.convnext.convnext.2.dwconv.weight": "w000020", + "tts.ttl.text_encoder.convnext.convnext.2.dwconv.bias": "w000021", + "tts.ttl.text_encoder.convnext.convnext.2.norm.norm.weight": "w000022", + "tts.ttl.text_encoder.convnext.convnext.2.norm.norm.bias": "w000023", + "tts.ttl.text_encoder.convnext.convnext.2.pwconv1.weight": "w000024", + "tts.ttl.text_encoder.convnext.convnext.2.pwconv1.bias": "w000025", + "tts.ttl.text_encoder.convnext.convnext.2.pwconv2.weight": "w000026", + "tts.ttl.text_encoder.convnext.convnext.2.pwconv2.bias": "w000027", + "tts.ttl.text_encoder.convnext.convnext.3.gamma": "w000028", + "tts.ttl.text_encoder.convnext.convnext.3.dwconv.weight": "w000029", + "tts.ttl.text_encoder.convnext.convnext.3.dwconv.bias": "w000030", + "tts.ttl.text_encoder.convnext.convnext.3.norm.norm.weight": "w000031", + "tts.ttl.text_encoder.convnext.convnext.3.norm.norm.bias": "w000032", + "tts.ttl.text_encoder.convnext.convnext.3.pwconv1.weight": "w000033", + "tts.ttl.text_encoder.convnext.convnext.3.pwconv1.bias": "w000034", + "tts.ttl.text_encoder.convnext.convnext.3.pwconv2.weight": "w000035", + "tts.ttl.text_encoder.convnext.convnext.3.pwconv2.bias": "w000036", + "tts.ttl.text_encoder.convnext.convnext.4.gamma": "w000037", + "tts.ttl.text_encoder.convnext.convnext.4.dwconv.weight": "w000038", + "tts.ttl.text_encoder.convnext.convnext.4.dwconv.bias": "w000039", + "tts.ttl.text_encoder.convnext.convnext.4.norm.norm.weight": "w000040", + "tts.ttl.text_encoder.convnext.convnext.4.norm.norm.bias": "w000041", + "tts.ttl.text_encoder.convnext.convnext.4.pwconv1.weight": "w000042", + "tts.ttl.text_encoder.convnext.convnext.4.pwconv1.bias": "w000043", + "tts.ttl.text_encoder.convnext.convnext.4.pwconv2.weight": "w000044", + "tts.ttl.text_encoder.convnext.convnext.4.pwconv2.bias": "w000045", + "tts.ttl.text_encoder.convnext.convnext.5.gamma": "w000046", + "tts.ttl.text_encoder.convnext.convnext.5.dwconv.weight": "w000047", + "tts.ttl.text_encoder.convnext.convnext.5.dwconv.bias": "w000048", + "tts.ttl.text_encoder.convnext.convnext.5.norm.norm.weight": "w000049", + "tts.ttl.text_encoder.convnext.convnext.5.norm.norm.bias": "w000050", + "tts.ttl.text_encoder.convnext.convnext.5.pwconv1.weight": "w000051", + "tts.ttl.text_encoder.convnext.convnext.5.pwconv1.bias": "w000052", + "tts.ttl.text_encoder.convnext.convnext.5.pwconv2.weight": "w000053", + "tts.ttl.text_encoder.convnext.convnext.5.pwconv2.bias": "w000054", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.emb_rel_k": "w000055", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.emb_rel_v": "w000056", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_q.weight": "w000057", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_q.bias": "w000058", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_k.weight": "w000059", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_k.bias": "w000060", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_v.weight": "w000061", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_v.bias": "w000062", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_o.weight": "w000063", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_o.bias": "w000064", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.emb_rel_k": "w000065", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.emb_rel_v": "w000066", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_q.weight": "w000067", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_q.bias": "w000068", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_k.weight": "w000069", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_k.bias": "w000070", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_v.weight": "w000071", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_v.bias": "w000072", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_o.weight": "w000073", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_o.bias": "w000074", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.emb_rel_k": "w000075", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.emb_rel_v": "w000076", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_q.weight": "w000077", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_q.bias": "w000078", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_k.weight": "w000079", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_k.bias": "w000080", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_v.weight": "w000081", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_v.bias": "w000082", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_o.weight": "w000083", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_o.bias": "w000084", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.emb_rel_k": "w000085", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.emb_rel_v": "w000086", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_q.weight": "w000087", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_q.bias": "w000088", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_k.weight": "w000089", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_k.bias": "w000090", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_v.weight": "w000091", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_v.bias": "w000092", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_o.weight": "w000093", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_o.bias": "w000094", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.0.norm.weight": "w000095", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.0.norm.bias": "w000096", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.1.norm.weight": "w000097", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.1.norm.bias": "w000098", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.2.norm.weight": "w000099", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.2.norm.bias": "w000100", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.3.norm.weight": "w000101", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.3.norm.bias": "w000102", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.0.conv_1.weight": "w000103", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.0.conv_1.bias": "w000104", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.0.conv_2.weight": "w000105", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.0.conv_2.bias": "w000106", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.1.conv_1.weight": "w000107", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.1.conv_1.bias": "w000108", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.1.conv_2.weight": "w000109", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.1.conv_2.bias": "w000110", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.2.conv_1.weight": "w000111", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.2.conv_1.bias": "w000112", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.2.conv_2.weight": "w000113", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.2.conv_2.bias": "w000114", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.3.conv_1.weight": "w000115", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.3.conv_1.bias": "w000116", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.3.conv_2.weight": "w000117", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.3.conv_2.bias": "w000118", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.0.norm.weight": "w000119", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.0.norm.bias": "w000120", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.1.norm.weight": "w000121", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.1.norm.bias": "w000122", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.2.norm.weight": "w000123", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.2.norm.bias": "w000124", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.3.norm.weight": "w000125", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.3.norm.bias": "w000126", + "tts.ttl.style_encoder.style_token_layer.style_key": "w000127", + "tts.ttl.speech_prompted_text_encoder.attention1.W_query.linear.bias": "w000128", + "tts.ttl.speech_prompted_text_encoder.attention1.W_key.linear.bias": "w000129", + "tts.ttl.speech_prompted_text_encoder.attention1.W_value.linear.bias": "w000130", + "tts.ttl.speech_prompted_text_encoder.attention1.out_fc.linear.bias": "w000131", + "tts.ttl.speech_prompted_text_encoder.attention2.W_query.linear.bias": "w000132", + "tts.ttl.speech_prompted_text_encoder.attention2.W_key.linear.bias": "w000133", + "tts.ttl.speech_prompted_text_encoder.attention2.W_value.linear.bias": "w000134", + "tts.ttl.speech_prompted_text_encoder.attention2.out_fc.linear.bias": "w000135", + "tts.ttl.speech_prompted_text_encoder.norm.norm.weight": "w000136", + "tts.ttl.speech_prompted_text_encoder.norm.norm.bias": "w000137", + "onnx::MatMul_3680": "w000138", + "onnx::MatMul_3681": "w000139", + "onnx::MatMul_3682": "w000140", + "onnx::MatMul_3683": "w000141", + "onnx::MatMul_3684": "w000142", + "onnx::MatMul_3685": "w000143", + "onnx::MatMul_3686": "w000144", + "onnx::MatMul_3687": "w000145", + "/text_encoder/convnext/convnext.0/dwconv/Constant_output_0": "c000000", + "/text_encoder/convnext/convnext.0/dwconv/Constant_1_output_0": "c000001", + "/text_encoder/convnext/convnext.0/dwconv/Constant_2_output_0": "c000002", + "/text_encoder/convnext/convnext.0/dwconv/Constant_3_output_0": "c000003", + "/text_encoder/convnext/convnext.0/dwconv/Constant_4_output_0": "c000004", + "/text_encoder/convnext/convnext.0/dwconv/Constant_5_output_0": "c000005", + "/text_encoder/convnext/convnext.0/dwconv/Constant_6_output_0": "c000006", + "/text_encoder/convnext/convnext.0/dwconv/Constant_7_output_0": "c000007", + "/text_encoder/convnext/convnext.0/act/Constant_output_0": "c000008", + "/text_encoder/convnext/convnext.0/act/Constant_1_output_0": "c000009", + "/text_encoder/convnext/convnext.0/act/Constant_2_output_0": "c000010", + "/text_encoder/convnext/convnext.1/dwconv/Constant_output_0": "c000011", + "/text_encoder/convnext/convnext.1/dwconv/Constant_1_output_0": "c000012", + "/text_encoder/convnext/convnext.1/dwconv/Constant_2_output_0": "c000013", + "/text_encoder/convnext/convnext.1/dwconv/Constant_3_output_0": "c000014", + "/text_encoder/convnext/convnext.1/dwconv/Constant_4_output_0": "c000015", + "/text_encoder/convnext/convnext.1/dwconv/Constant_5_output_0": "c000016", + "/text_encoder/convnext/convnext.1/dwconv/Constant_6_output_0": "c000017", + "/text_encoder/convnext/convnext.1/dwconv/Constant_7_output_0": "c000018", + "/text_encoder/convnext/convnext.1/act/Constant_output_0": "c000019", + "/text_encoder/convnext/convnext.1/act/Constant_1_output_0": "c000020", + "/text_encoder/convnext/convnext.1/act/Constant_2_output_0": "c000021", + "/text_encoder/convnext/convnext.2/dwconv/Constant_output_0": "c000022", + "/text_encoder/convnext/convnext.2/dwconv/Constant_1_output_0": "c000023", + "/text_encoder/convnext/convnext.2/dwconv/Constant_2_output_0": "c000024", + "/text_encoder/convnext/convnext.2/dwconv/Constant_3_output_0": "c000025", + "/text_encoder/convnext/convnext.2/dwconv/Constant_4_output_0": "c000026", + "/text_encoder/convnext/convnext.2/dwconv/Constant_5_output_0": "c000027", + "/text_encoder/convnext/convnext.2/dwconv/Constant_6_output_0": "c000028", + "/text_encoder/convnext/convnext.2/dwconv/Constant_7_output_0": "c000029", + "/text_encoder/convnext/convnext.2/act/Constant_output_0": "c000030", + "/text_encoder/convnext/convnext.2/act/Constant_1_output_0": "c000031", + "/text_encoder/convnext/convnext.2/act/Constant_2_output_0": "c000032", + "/text_encoder/convnext/convnext.3/dwconv/Constant_output_0": "c000033", + "/text_encoder/convnext/convnext.3/dwconv/Constant_1_output_0": "c000034", + "/text_encoder/convnext/convnext.3/dwconv/Constant_2_output_0": "c000035", + "/text_encoder/convnext/convnext.3/dwconv/Constant_3_output_0": "c000036", + "/text_encoder/convnext/convnext.3/dwconv/Constant_4_output_0": "c000037", + "/text_encoder/convnext/convnext.3/dwconv/Constant_5_output_0": "c000038", + "/text_encoder/convnext/convnext.3/dwconv/Constant_6_output_0": "c000039", + "/text_encoder/convnext/convnext.3/dwconv/Constant_7_output_0": "c000040", + "/text_encoder/convnext/convnext.3/act/Constant_output_0": "c000041", + "/text_encoder/convnext/convnext.3/act/Constant_1_output_0": "c000042", + "/text_encoder/convnext/convnext.3/act/Constant_2_output_0": "c000043", + "/text_encoder/convnext/convnext.4/dwconv/Constant_output_0": "c000044", + "/text_encoder/convnext/convnext.4/dwconv/Constant_1_output_0": "c000045", + "/text_encoder/convnext/convnext.4/dwconv/Constant_2_output_0": "c000046", + "/text_encoder/convnext/convnext.4/dwconv/Constant_3_output_0": "c000047", + "/text_encoder/convnext/convnext.4/dwconv/Constant_4_output_0": "c000048", + "/text_encoder/convnext/convnext.4/dwconv/Constant_5_output_0": "c000049", + "/text_encoder/convnext/convnext.4/dwconv/Constant_6_output_0": "c000050", + "/text_encoder/convnext/convnext.4/dwconv/Constant_7_output_0": "c000051", + "/text_encoder/convnext/convnext.4/act/Constant_output_0": "c000052", + "/text_encoder/convnext/convnext.4/act/Constant_1_output_0": "c000053", + "/text_encoder/convnext/convnext.4/act/Constant_2_output_0": "c000054", + "/text_encoder/convnext/convnext.5/dwconv/Constant_output_0": "c000055", + "/text_encoder/convnext/convnext.5/dwconv/Constant_1_output_0": "c000056", + "/text_encoder/convnext/convnext.5/dwconv/Constant_2_output_0": "c000057", + "/text_encoder/convnext/convnext.5/dwconv/Constant_3_output_0": "c000058", + "/text_encoder/convnext/convnext.5/dwconv/Constant_4_output_0": "c000059", + "/text_encoder/convnext/convnext.5/dwconv/Constant_5_output_0": "c000060", + "/text_encoder/convnext/convnext.5/dwconv/Constant_6_output_0": "c000061", + "/text_encoder/convnext/convnext.5/dwconv/Constant_7_output_0": "c000062", + "/text_encoder/convnext/convnext.5/act/Constant_output_0": "c000063", + "/text_encoder/convnext/convnext.5/act/Constant_1_output_0": "c000064", + "/text_encoder/convnext/convnext.5/act/Constant_2_output_0": "c000065", + "/text_encoder/attn_encoder/Constant_output_0": "c000066", + "/text_encoder/attn_encoder/Constant_1_output_0": "c000067", + "/text_encoder/attn_encoder/attn_layers.0/Constant_output_0": "c000068", + "/text_encoder/attn_encoder/attn_layers.0/Constant_1_output_0": "c000069", + "/text_encoder/attn_encoder/attn_layers.0/Constant_2_output_0": "c000070", + "/text_encoder/attn_encoder/attn_layers.0/Constant_3_output_0": "c000071", + "onnx::Unsqueeze_1234": "c000072", + "/text_encoder/attn_encoder/attn_layers.0/Constant_4_output_0": "c000073", + "/text_encoder/attn_encoder/attn_layers.0/Constant_5_output_0": "c000074", + "onnx::Unsqueeze_1240": "c000075", + "onnx::Unsqueeze_1246": "c000076", + "/text_encoder/attn_encoder/attn_layers.0/Constant_6_output_0": "c000077", + "/text_encoder/attn_encoder/attn_layers.0/Constant_7_output_0": "c000078", + "onnx::Unsqueeze_1252": "c000079", + "onnx::Unsqueeze_1255": "c000080", + "/text_encoder/attn_encoder/attn_layers.0/Constant_8_output_0": "c000081", + "/text_encoder/attn_encoder/attn_layers.0/Constant_9_output_0": "c000082", + "onnx::Unsqueeze_1261": "c000083", + "/text_encoder/attn_encoder/attn_layers.0/Constant_10_output_0": "c000084", + "/text_encoder/attn_encoder/attn_layers.0/Constant_11_output_0": "c000085", + "/text_encoder/attn_encoder/attn_layers.0/Constant_12_output_0": "c000086", + "/text_encoder/attn_encoder/attn_layers.0/Constant_13_output_0": "c000087", + "/text_encoder/attn_encoder/attn_layers.0/Constant_14_output_0": "c000088", + "/text_encoder/attn_encoder/attn_layers.0/Constant_15_output_0": "c000089", + "/text_encoder/attn_encoder/attn_layers.0/Constant_16_output_0": "c000090", + "/text_encoder/attn_encoder/attn_layers.0/Constant_17_output_0": "c000091", + "/text_encoder/attn_encoder/attn_layers.0/Constant_18_output_0": "c000092", + "onnx::Unsqueeze_1291": "c000093", + "onnx::Unsqueeze_1293": "c000094", + "/text_encoder/attn_encoder/attn_layers.0/Constant_19_output_0": "c000095", + "/text_encoder/attn_encoder/attn_layers.0/Constant_20_output_0": "c000096", + "/text_encoder/attn_encoder/attn_layers.0/Constant_21_output_0": "c000097", + "/text_encoder/attn_encoder/attn_layers.0/Constant_22_output_0": "c000098", + "onnx::Unsqueeze_1304": "c000099", + "onnx::Unsqueeze_1306": "c000100", + "/text_encoder/attn_encoder/attn_layers.0/Constant_23_output_0": "c000101", + "/text_encoder/attn_encoder/attn_layers.0/Constant_24_output_0": "c000102", + "/text_encoder/attn_encoder/attn_layers.0/Constant_25_output_0": "c000103", + "/text_encoder/attn_encoder/attn_layers.0/Constant_26_output_0": "c000104", + "onnx::Unsqueeze_1317": "c000105", + "onnx::Unsqueeze_1319": "c000106", + "/text_encoder/attn_encoder/attn_layers.0/Constant_27_output_0": "c000107", + "/text_encoder/attn_encoder/attn_layers.0/Constant_28_output_0": "c000108", + "/text_encoder/attn_encoder/attn_layers.0/Constant_29_output_0": "c000109", + "/text_encoder/attn_encoder/attn_layers.0/Constant_30_output_0": "c000110", + "onnx::Unsqueeze_1330": "c000111", + "onnx::Unsqueeze_1332": "c000112", + "/text_encoder/attn_encoder/attn_layers.0/Constant_31_output_0": "c000113", + "/text_encoder/attn_encoder/attn_layers.0/Constant_32_output_0": "c000114", + "/text_encoder/attn_encoder/attn_layers.0/Constant_33_output_0": "c000115", + "/text_encoder/attn_encoder/attn_layers.0/Constant_34_output_0": "c000116", + "/text_encoder/attn_encoder/attn_layers.0/Constant_35_output_0": "c000117", + "/text_encoder/attn_encoder/attn_layers.0/Constant_36_output_0": "c000118", + "/text_encoder/attn_encoder/attn_layers.0/Constant_37_output_0": "c000119", + "/text_encoder/attn_encoder/attn_layers.0/Constant_38_output_0": "c000120", + "/text_encoder/attn_encoder/attn_layers.0/Constant_39_output_0": "c000121", + "/text_encoder/attn_encoder/attn_layers.0/Constant_40_output_0": "c000122", + "/text_encoder/attn_encoder/attn_layers.0/Constant_41_output_0": "c000123", + "/text_encoder/attn_encoder/attn_layers.0/Constant_42_output_0": "c000124", + "/text_encoder/attn_encoder/attn_layers.0/Constant_43_output_0": "c000125", + "/text_encoder/attn_encoder/attn_layers.0/Constant_44_output_0": "c000126", + "/text_encoder/attn_encoder/attn_layers.0/Constant_45_output_0": "c000127", + "/text_encoder/attn_encoder/attn_layers.0/Constant_46_output_0": "c000128", + "/text_encoder/attn_encoder/attn_layers.0/Constant_47_output_0": "c000129", + "/text_encoder/attn_encoder/attn_layers.0/Constant_48_output_0": "c000130", + "/text_encoder/attn_encoder/attn_layers.0/Constant_49_output_0": "c000131", + "/text_encoder/attn_encoder/attn_layers.0/Constant_50_output_0": "c000132", + "/text_encoder/attn_encoder/attn_layers.0/Constant_51_output_0": "c000133", + "/text_encoder/attn_encoder/attn_layers.0/Constant_52_output_0": "c000134", + "/text_encoder/attn_encoder/attn_layers.0/Constant_53_output_0": "c000135", + "/text_encoder/attn_encoder/attn_layers.0/Constant_54_output_0": "c000136", + "/text_encoder/attn_encoder/attn_layers.0/Constant_55_output_0": "c000137", + "/text_encoder/attn_encoder/attn_layers.0/Constant_56_output_0": "c000138", + "/text_encoder/attn_encoder/attn_layers.0/Constant_57_output_0": "c000139", + "onnx::Unsqueeze_1410": "c000140", + "onnx::Unsqueeze_1412": "c000141", + "onnx::Unsqueeze_1414": "c000142", + "/text_encoder/attn_encoder/attn_layers.0/Constant_58_output_0": "c000143", + "/text_encoder/attn_encoder/attn_layers.0/Constant_59_output_0": "c000144", + "onnx::Unsqueeze_1422": "c000145", + "/text_encoder/attn_encoder/attn_layers.0/Constant_60_output_0": "c000146", + "/text_encoder/attn_encoder/attn_layers.0/Constant_61_output_0": "c000147", + "/text_encoder/attn_encoder/attn_layers.0/Constant_62_output_0": "c000148", + "/text_encoder/attn_encoder/attn_layers.0/Constant_63_output_0": "c000149", + "/text_encoder/attn_encoder/attn_layers.0/Constant_64_output_0": "c000150", + "onnx::Unsqueeze_1435": "c000151", + "/text_encoder/attn_encoder/attn_layers.0/Constant_65_output_0": "c000152", + "/text_encoder/attn_encoder/attn_layers.0/Constant_66_output_0": "c000153", + "/text_encoder/attn_encoder/attn_layers.0/Constant_67_output_0": "c000154", + "/text_encoder/attn_encoder/attn_layers.0/Constant_68_output_0": "c000155", + "/text_encoder/attn_encoder/attn_layers.0/Constant_69_output_0": "c000156", + "/text_encoder/attn_encoder/attn_layers.0/Constant_70_output_0": "c000157", + "/text_encoder/attn_encoder/attn_layers.0/Constant_71_output_0": "c000158", + "/text_encoder/attn_encoder/attn_layers.0/Constant_72_output_0": "c000159", + "/text_encoder/attn_encoder/attn_layers.0/Constant_73_output_0": "c000160", + "/text_encoder/attn_encoder/attn_layers.0/Constant_74_output_0": "c000161", + "/text_encoder/attn_encoder/attn_layers.0/Constant_75_output_0": "c000162", + "/text_encoder/attn_encoder/attn_layers.0/Constant_76_output_0": "c000163", + "/text_encoder/attn_encoder/attn_layers.0/Constant_77_output_0": "c000164", + "/text_encoder/attn_encoder/attn_layers.0/Constant_78_output_0": "c000165", + "onnx::Unsqueeze_1472": "c000166", + "onnx::Unsqueeze_1474": "c000167", + "onnx::Unsqueeze_1476": "c000168", + "onnx::Unsqueeze_1478": "c000169", + "/text_encoder/attn_encoder/attn_layers.0/Constant_79_output_0": "c000170", + "/text_encoder/attn_encoder/attn_layers.0/Constant_80_output_0": "c000171", + "/text_encoder/attn_encoder/attn_layers.0/Constant_81_output_0": "c000172", + "/text_encoder/attn_encoder/attn_layers.0/Constant_82_output_0": "c000173", + "/text_encoder/attn_encoder/attn_layers.0/Constant_83_output_0": "c000174", + "/text_encoder/attn_encoder/attn_layers.0/Constant_84_output_0": "c000175", + "/text_encoder/attn_encoder/attn_layers.0/Constant_85_output_0": "c000176", + "/text_encoder/attn_encoder/attn_layers.0/Constant_86_output_0": "c000177", + "/text_encoder/attn_encoder/attn_layers.0/Constant_87_output_0": "c000178", + "/text_encoder/attn_encoder/attn_layers.0/Constant_88_output_0": "c000179", + "/text_encoder/attn_encoder/attn_layers.0/Constant_89_output_0": "c000180", + "/text_encoder/attn_encoder/attn_layers.0/Constant_90_output_0": "c000181", + "/text_encoder/attn_encoder/attn_layers.0/Constant_91_output_0": "c000182", + "/text_encoder/attn_encoder/attn_layers.0/Constant_92_output_0": "c000183", + "/text_encoder/attn_encoder/attn_layers.0/Constant_93_output_0": "c000184", + "onnx::Unsqueeze_1521": "c000185", + "/text_encoder/attn_encoder/attn_layers.0/Constant_94_output_0": "c000186", + "/text_encoder/attn_encoder/attn_layers.0/Constant_95_output_0": "c000187", + "/text_encoder/attn_encoder/attn_layers.0/Constant_96_output_0": "c000188", + "/text_encoder/attn_encoder/attn_layers.0/Constant_97_output_0": "c000189", + "/text_encoder/attn_encoder/attn_layers.0/Constant_98_output_0": "c000190", + "/text_encoder/attn_encoder/attn_layers.0/Constant_99_output_0": "c000191", + "/text_encoder/attn_encoder/attn_layers.0/Constant_100_output_0": "c000192", + "onnx::Unsqueeze_1538": "c000193", + "/text_encoder/attn_encoder/attn_layers.0/Constant_101_output_0": "c000194", + "/text_encoder/attn_encoder/attn_layers.0/Constant_102_output_0": "c000195", + "/text_encoder/attn_encoder/attn_layers.0/Constant_103_output_0": "c000196", + "/text_encoder/attn_encoder/attn_layers.0/Constant_104_output_0": "c000197", + "/text_encoder/attn_encoder/attn_layers.0/Constant_105_output_0": "c000198", + "/text_encoder/attn_encoder/attn_layers.0/Constant_106_output_0": "c000199", + "/text_encoder/attn_encoder/attn_layers.0/Constant_107_output_0": "c000200", + "/text_encoder/attn_encoder/attn_layers.0/Constant_108_output_0": "c000201", + "/text_encoder/attn_encoder/attn_layers.0/Constant_109_output_0": "c000202", + "/text_encoder/attn_encoder/attn_layers.0/Constant_110_output_0": "c000203", + "/text_encoder/attn_encoder/attn_layers.0/Constant_111_output_0": "c000204", + "/text_encoder/attn_encoder/attn_layers.0/Constant_112_output_0": "c000205", + "/text_encoder/attn_encoder/attn_layers.0/Constant_113_output_0": "c000206", + "/text_encoder/attn_encoder/attn_layers.0/Constant_114_output_0": "c000207", + "/text_encoder/attn_encoder/attn_layers.0/Constant_115_output_0": "c000208", + "onnx::Unsqueeze_1579": "c000209", + "onnx::Unsqueeze_1581": "c000210", + "onnx::Unsqueeze_1583": "c000211", + "onnx::Unsqueeze_1587": "c000212", + "/text_encoder/attn_encoder/attn_layers.0/Constant_116_output_0": "c000213", + "/text_encoder/attn_encoder/attn_layers.0/Constant_117_output_0": "c000214", + "/text_encoder/attn_encoder/attn_layers.0/Constant_118_output_0": "c000215", + "/text_encoder/attn_encoder/attn_layers.0/Constant_119_output_0": "c000216", + "/text_encoder/attn_encoder/attn_layers.0/Constant_120_output_0": "c000217", + "onnx::Unsqueeze_1600": "c000218", + "/text_encoder/attn_encoder/attn_layers.0/Constant_121_output_0": "c000219", + "/text_encoder/attn_encoder/attn_layers.0/Constant_122_output_0": "c000220", + "/text_encoder/attn_encoder/attn_layers.0/Constant_123_output_0": "c000221", + "/text_encoder/attn_encoder/attn_layers.0/Constant_124_output_0": "c000222", + "/text_encoder/attn_encoder/attn_layers.0/Constant_125_output_0": "c000223", + "/text_encoder/attn_encoder/attn_layers.0/Constant_126_output_0": "c000224", + "/text_encoder/attn_encoder/attn_layers.0/Constant_127_output_0": "c000225", + "/text_encoder/attn_encoder/attn_layers.0/Constant_128_output_0": "c000226", + "/text_encoder/attn_encoder/attn_layers.0/Constant_129_output_0": "c000227", + "/text_encoder/attn_encoder/attn_layers.0/Constant_130_output_0": "c000228", + "/text_encoder/attn_encoder/attn_layers.0/Constant_131_output_0": "c000229", + "/text_encoder/attn_encoder/attn_layers.0/Constant_132_output_0": "c000230", + "/text_encoder/attn_encoder/attn_layers.0/Constant_133_output_0": "c000231", + "/text_encoder/attn_encoder/attn_layers.0/Constant_134_output_0": "c000232", + "onnx::Unsqueeze_1637": "c000233", + "onnx::Unsqueeze_1639": "c000234", + "onnx::Unsqueeze_1641": "c000235", + "onnx::Unsqueeze_1643": "c000236", + "/text_encoder/attn_encoder/attn_layers.0/Constant_135_output_0": "c000237", + "/text_encoder/attn_encoder/attn_layers.0/Constant_136_output_0": "c000238", + "/text_encoder/attn_encoder/attn_layers.0/Constant_137_output_0": "c000239", + "/text_encoder/attn_encoder/attn_layers.0/Constant_138_output_0": "c000240", + "/text_encoder/attn_encoder/attn_layers.0/Constant_139_output_0": "c000241", + "/text_encoder/attn_encoder/attn_layers.0/Constant_140_output_0": "c000242", + "/text_encoder/attn_encoder/attn_layers.0/Constant_141_output_0": "c000243", + "/text_encoder/attn_encoder/attn_layers.0/Constant_142_output_0": "c000244", + "/text_encoder/attn_encoder/attn_layers.0/Constant_143_output_0": "c000245", + "/text_encoder/attn_encoder/attn_layers.0/Constant_144_output_0": "c000246", + "/text_encoder/attn_encoder/attn_layers.0/Constant_145_output_0": "c000247", + "/text_encoder/attn_encoder/attn_layers.0/Constant_146_output_0": "c000248", + "/text_encoder/attn_encoder/attn_layers.0/Constant_147_output_0": "c000249", + "/text_encoder/attn_encoder/attn_layers.0/Constant_148_output_0": "c000250", + "/text_encoder/attn_encoder/attn_layers.0/Constant_149_output_0": "c000251", + "/text_encoder/attn_encoder/attn_layers.0/Constant_150_output_0": "c000252", + "/text_encoder/attn_encoder/attn_layers.0/Constant_151_output_0": "c000253", + "onnx::Unsqueeze_1692": "c000254", + "onnx::Unsqueeze_1694": "c000255", + "onnx::Unsqueeze_1696": "c000256", + "/text_encoder/attn_encoder/attn_layers.1/Constant_output_0": "c000257", + "/text_encoder/attn_encoder/attn_layers.1/Constant_1_output_0": "c000258", + "/text_encoder/attn_encoder/attn_layers.1/Constant_2_output_0": "c000259", + "/text_encoder/attn_encoder/attn_layers.1/Constant_3_output_0": "c000260", + "onnx::Unsqueeze_1730": "c000261", + "/text_encoder/attn_encoder/attn_layers.1/Constant_4_output_0": "c000262", + "/text_encoder/attn_encoder/attn_layers.1/Constant_5_output_0": "c000263", + "onnx::Unsqueeze_1736": "c000264", + "onnx::Unsqueeze_1741": "c000265", + "/text_encoder/attn_encoder/attn_layers.1/Constant_6_output_0": "c000266", + "/text_encoder/attn_encoder/attn_layers.1/Constant_7_output_0": "c000267", + "onnx::Unsqueeze_1747": "c000268", + "onnx::Unsqueeze_1750": "c000269", + "/text_encoder/attn_encoder/attn_layers.1/Constant_8_output_0": "c000270", + "/text_encoder/attn_encoder/attn_layers.1/Constant_9_output_0": "c000271", + "onnx::Unsqueeze_1756": "c000272", + "/text_encoder/attn_encoder/attn_layers.1/Constant_10_output_0": "c000273", + "/text_encoder/attn_encoder/attn_layers.1/Constant_11_output_0": "c000274", + "/text_encoder/attn_encoder/attn_layers.1/Constant_12_output_0": "c000275", + "/text_encoder/attn_encoder/attn_layers.1/Constant_13_output_0": "c000276", + "/text_encoder/attn_encoder/attn_layers.1/Constant_14_output_0": "c000277", + "/text_encoder/attn_encoder/attn_layers.1/Constant_15_output_0": "c000278", + "/text_encoder/attn_encoder/attn_layers.1/Constant_16_output_0": "c000279", + "/text_encoder/attn_encoder/attn_layers.1/Constant_17_output_0": "c000280", + "/text_encoder/attn_encoder/attn_layers.1/Constant_18_output_0": "c000281", + "onnx::Unsqueeze_1786": "c000282", + "onnx::Unsqueeze_1788": "c000283", + "/text_encoder/attn_encoder/attn_layers.1/Constant_19_output_0": "c000284", + "/text_encoder/attn_encoder/attn_layers.1/Constant_20_output_0": "c000285", + "/text_encoder/attn_encoder/attn_layers.1/Constant_21_output_0": "c000286", + "/text_encoder/attn_encoder/attn_layers.1/Constant_22_output_0": "c000287", + "onnx::Unsqueeze_1799": "c000288", + "onnx::Unsqueeze_1801": "c000289", + "/text_encoder/attn_encoder/attn_layers.1/Constant_23_output_0": "c000290", + "/text_encoder/attn_encoder/attn_layers.1/Constant_24_output_0": "c000291", + "/text_encoder/attn_encoder/attn_layers.1/Constant_25_output_0": "c000292", + "/text_encoder/attn_encoder/attn_layers.1/Constant_26_output_0": "c000293", + "onnx::Unsqueeze_1812": "c000294", + "onnx::Unsqueeze_1814": "c000295", + "/text_encoder/attn_encoder/attn_layers.1/Constant_27_output_0": "c000296", + "/text_encoder/attn_encoder/attn_layers.1/Constant_28_output_0": "c000297", + "/text_encoder/attn_encoder/attn_layers.1/Constant_29_output_0": "c000298", + "/text_encoder/attn_encoder/attn_layers.1/Constant_30_output_0": "c000299", + "onnx::Unsqueeze_1825": "c000300", + "onnx::Unsqueeze_1827": "c000301", + "/text_encoder/attn_encoder/attn_layers.1/Constant_31_output_0": "c000302", + "/text_encoder/attn_encoder/attn_layers.1/Constant_32_output_0": "c000303", + "/text_encoder/attn_encoder/attn_layers.1/Constant_33_output_0": "c000304", + "/text_encoder/attn_encoder/attn_layers.1/Constant_34_output_0": "c000305", + "/text_encoder/attn_encoder/attn_layers.1/Constant_35_output_0": "c000306", + "/text_encoder/attn_encoder/attn_layers.1/Constant_36_output_0": "c000307", + "/text_encoder/attn_encoder/attn_layers.1/Constant_37_output_0": "c000308", + "/text_encoder/attn_encoder/attn_layers.1/Constant_38_output_0": "c000309", + "/text_encoder/attn_encoder/attn_layers.1/Constant_39_output_0": "c000310", + "/text_encoder/attn_encoder/attn_layers.1/Constant_40_output_0": "c000311", + "/text_encoder/attn_encoder/attn_layers.1/Constant_41_output_0": "c000312", + "/text_encoder/attn_encoder/attn_layers.1/Constant_42_output_0": "c000313", + "/text_encoder/attn_encoder/attn_layers.1/Constant_43_output_0": "c000314", + "/text_encoder/attn_encoder/attn_layers.1/Constant_44_output_0": "c000315", + "/text_encoder/attn_encoder/attn_layers.1/Constant_45_output_0": "c000316", + "/text_encoder/attn_encoder/attn_layers.1/Constant_46_output_0": "c000317", + "/text_encoder/attn_encoder/attn_layers.1/Constant_47_output_0": "c000318", + "/text_encoder/attn_encoder/attn_layers.1/Constant_48_output_0": "c000319", + "/text_encoder/attn_encoder/attn_layers.1/Constant_49_output_0": "c000320", + "/text_encoder/attn_encoder/attn_layers.1/Constant_50_output_0": "c000321", + "/text_encoder/attn_encoder/attn_layers.1/Constant_51_output_0": "c000322", + "/text_encoder/attn_encoder/attn_layers.1/Constant_52_output_0": "c000323", + "/text_encoder/attn_encoder/attn_layers.1/Constant_53_output_0": "c000324", + "/text_encoder/attn_encoder/attn_layers.1/Constant_54_output_0": "c000325", + "/text_encoder/attn_encoder/attn_layers.1/Constant_55_output_0": "c000326", + "/text_encoder/attn_encoder/attn_layers.1/Constant_56_output_0": "c000327", + "/text_encoder/attn_encoder/attn_layers.1/Constant_57_output_0": "c000328", + "onnx::Unsqueeze_1903": "c000329", + "onnx::Unsqueeze_1905": "c000330", + "onnx::Unsqueeze_1907": "c000331", + "/text_encoder/attn_encoder/attn_layers.1/Constant_58_output_0": "c000332", + "/text_encoder/attn_encoder/attn_layers.1/Constant_59_output_0": "c000333", + "onnx::Unsqueeze_1915": "c000334", + "/text_encoder/attn_encoder/attn_layers.1/Constant_60_output_0": "c000335", + "/text_encoder/attn_encoder/attn_layers.1/Constant_61_output_0": "c000336", + "/text_encoder/attn_encoder/attn_layers.1/Constant_62_output_0": "c000337", + "/text_encoder/attn_encoder/attn_layers.1/Constant_63_output_0": "c000338", + "/text_encoder/attn_encoder/attn_layers.1/Constant_64_output_0": "c000339", + "onnx::Unsqueeze_1928": "c000340", + "/text_encoder/attn_encoder/attn_layers.1/Constant_65_output_0": "c000341", + "/text_encoder/attn_encoder/attn_layers.1/Constant_66_output_0": "c000342", + "/text_encoder/attn_encoder/attn_layers.1/Constant_67_output_0": "c000343", + "/text_encoder/attn_encoder/attn_layers.1/Constant_68_output_0": "c000344", + "/text_encoder/attn_encoder/attn_layers.1/Constant_69_output_0": "c000345", + "/text_encoder/attn_encoder/attn_layers.1/Constant_70_output_0": "c000346", + "/text_encoder/attn_encoder/attn_layers.1/Constant_71_output_0": "c000347", + "/text_encoder/attn_encoder/attn_layers.1/Constant_72_output_0": "c000348", + "/text_encoder/attn_encoder/attn_layers.1/Constant_73_output_0": "c000349", + "/text_encoder/attn_encoder/attn_layers.1/Constant_74_output_0": "c000350", + "/text_encoder/attn_encoder/attn_layers.1/Constant_75_output_0": "c000351", + "/text_encoder/attn_encoder/attn_layers.1/Constant_76_output_0": "c000352", + "/text_encoder/attn_encoder/attn_layers.1/Constant_77_output_0": "c000353", + "/text_encoder/attn_encoder/attn_layers.1/Constant_78_output_0": "c000354", + "onnx::Unsqueeze_1965": "c000355", + "onnx::Unsqueeze_1967": "c000356", + "onnx::Unsqueeze_1969": "c000357", + "onnx::Unsqueeze_1971": "c000358", + "/text_encoder/attn_encoder/attn_layers.1/Constant_79_output_0": "c000359", + "/text_encoder/attn_encoder/attn_layers.1/Constant_80_output_0": "c000360", + "/text_encoder/attn_encoder/attn_layers.1/Constant_81_output_0": "c000361", + "/text_encoder/attn_encoder/attn_layers.1/Constant_82_output_0": "c000362", + "/text_encoder/attn_encoder/attn_layers.1/Constant_83_output_0": "c000363", + "/text_encoder/attn_encoder/attn_layers.1/Constant_84_output_0": "c000364", + "/text_encoder/attn_encoder/attn_layers.1/Constant_85_output_0": "c000365", + "/text_encoder/attn_encoder/attn_layers.1/Constant_86_output_0": "c000366", + "/text_encoder/attn_encoder/attn_layers.1/Constant_87_output_0": "c000367", + "/text_encoder/attn_encoder/attn_layers.1/Constant_88_output_0": "c000368", + "/text_encoder/attn_encoder/attn_layers.1/Constant_89_output_0": "c000369", + "/text_encoder/attn_encoder/attn_layers.1/Constant_90_output_0": "c000370", + "/text_encoder/attn_encoder/attn_layers.1/Constant_91_output_0": "c000371", + "/text_encoder/attn_encoder/attn_layers.1/Constant_92_output_0": "c000372", + "onnx::Unsqueeze_2012": "c000373", + "/text_encoder/attn_encoder/attn_layers.1/Constant_93_output_0": "c000374", + "/text_encoder/attn_encoder/attn_layers.1/Constant_94_output_0": "c000375", + "/text_encoder/attn_encoder/attn_layers.1/Constant_95_output_0": "c000376", + "/text_encoder/attn_encoder/attn_layers.1/Constant_96_output_0": "c000377", + "/text_encoder/attn_encoder/attn_layers.1/Constant_97_output_0": "c000378", + "/text_encoder/attn_encoder/attn_layers.1/Constant_98_output_0": "c000379", + "/text_encoder/attn_encoder/attn_layers.1/Constant_99_output_0": "c000380", + "onnx::Unsqueeze_2029": "c000381", + "/text_encoder/attn_encoder/attn_layers.1/Constant_100_output_0": "c000382", + "/text_encoder/attn_encoder/attn_layers.1/Constant_101_output_0": "c000383", + "/text_encoder/attn_encoder/attn_layers.1/Constant_102_output_0": "c000384", + "/text_encoder/attn_encoder/attn_layers.1/Constant_103_output_0": "c000385", + "/text_encoder/attn_encoder/attn_layers.1/Constant_104_output_0": "c000386", + "/text_encoder/attn_encoder/attn_layers.1/Constant_105_output_0": "c000387", + "/text_encoder/attn_encoder/attn_layers.1/Constant_106_output_0": "c000388", + "/text_encoder/attn_encoder/attn_layers.1/Constant_107_output_0": "c000389", + "/text_encoder/attn_encoder/attn_layers.1/Constant_108_output_0": "c000390", + "/text_encoder/attn_encoder/attn_layers.1/Constant_109_output_0": "c000391", + "/text_encoder/attn_encoder/attn_layers.1/Constant_110_output_0": "c000392", + "/text_encoder/attn_encoder/attn_layers.1/Constant_111_output_0": "c000393", + "/text_encoder/attn_encoder/attn_layers.1/Constant_112_output_0": "c000394", + "/text_encoder/attn_encoder/attn_layers.1/Constant_113_output_0": "c000395", + "/text_encoder/attn_encoder/attn_layers.1/Constant_114_output_0": "c000396", + "onnx::Unsqueeze_2070": "c000397", + "onnx::Unsqueeze_2072": "c000398", + "onnx::Unsqueeze_2074": "c000399", + "onnx::Unsqueeze_2078": "c000400", + "/text_encoder/attn_encoder/attn_layers.1/Constant_115_output_0": "c000401", + "/text_encoder/attn_encoder/attn_layers.1/Constant_116_output_0": "c000402", + "/text_encoder/attn_encoder/attn_layers.1/Constant_117_output_0": "c000403", + "/text_encoder/attn_encoder/attn_layers.1/Constant_118_output_0": "c000404", + "/text_encoder/attn_encoder/attn_layers.1/Constant_119_output_0": "c000405", + "onnx::Unsqueeze_2091": "c000406", + "/text_encoder/attn_encoder/attn_layers.1/Constant_120_output_0": "c000407", + "/text_encoder/attn_encoder/attn_layers.1/Constant_121_output_0": "c000408", + "/text_encoder/attn_encoder/attn_layers.1/Constant_122_output_0": "c000409", + "/text_encoder/attn_encoder/attn_layers.1/Constant_123_output_0": "c000410", + "/text_encoder/attn_encoder/attn_layers.1/Constant_124_output_0": "c000411", + "/text_encoder/attn_encoder/attn_layers.1/Constant_125_output_0": "c000412", + "/text_encoder/attn_encoder/attn_layers.1/Constant_126_output_0": "c000413", + "/text_encoder/attn_encoder/attn_layers.1/Constant_127_output_0": "c000414", + "/text_encoder/attn_encoder/attn_layers.1/Constant_128_output_0": "c000415", + "/text_encoder/attn_encoder/attn_layers.1/Constant_129_output_0": "c000416", + "/text_encoder/attn_encoder/attn_layers.1/Constant_130_output_0": "c000417", + "/text_encoder/attn_encoder/attn_layers.1/Constant_131_output_0": "c000418", + "/text_encoder/attn_encoder/attn_layers.1/Constant_132_output_0": "c000419", + "/text_encoder/attn_encoder/attn_layers.1/Constant_133_output_0": "c000420", + "onnx::Unsqueeze_2128": "c000421", + "onnx::Unsqueeze_2130": "c000422", + "onnx::Unsqueeze_2132": "c000423", + "onnx::Unsqueeze_2134": "c000424", + "/text_encoder/attn_encoder/attn_layers.1/Constant_134_output_0": "c000425", + "/text_encoder/attn_encoder/attn_layers.1/Constant_135_output_0": "c000426", + "/text_encoder/attn_encoder/attn_layers.1/Constant_136_output_0": "c000427", + "/text_encoder/attn_encoder/attn_layers.1/Constant_137_output_0": "c000428", + "/text_encoder/attn_encoder/attn_layers.1/Constant_138_output_0": "c000429", + "/text_encoder/attn_encoder/attn_layers.1/Constant_139_output_0": "c000430", + "/text_encoder/attn_encoder/attn_layers.1/Constant_140_output_0": "c000431", + "/text_encoder/attn_encoder/attn_layers.1/Constant_141_output_0": "c000432", + "/text_encoder/attn_encoder/attn_layers.1/Constant_142_output_0": "c000433", + "/text_encoder/attn_encoder/attn_layers.1/Constant_143_output_0": "c000434", + "/text_encoder/attn_encoder/attn_layers.1/Constant_144_output_0": "c000435", + "/text_encoder/attn_encoder/attn_layers.1/Constant_145_output_0": "c000436", + "/text_encoder/attn_encoder/attn_layers.1/Constant_146_output_0": "c000437", + "/text_encoder/attn_encoder/attn_layers.1/Constant_147_output_0": "c000438", + "/text_encoder/attn_encoder/attn_layers.1/Constant_148_output_0": "c000439", + "/text_encoder/attn_encoder/attn_layers.1/Constant_149_output_0": "c000440", + "/text_encoder/attn_encoder/attn_layers.1/Constant_150_output_0": "c000441", + "onnx::Unsqueeze_2183": "c000442", + "onnx::Unsqueeze_2185": "c000443", + "onnx::Unsqueeze_2187": "c000444", + "/text_encoder/attn_encoder/attn_layers.2/Constant_output_0": "c000445", + "/text_encoder/attn_encoder/attn_layers.2/Constant_1_output_0": "c000446", + "/text_encoder/attn_encoder/attn_layers.2/Constant_2_output_0": "c000447", + "/text_encoder/attn_encoder/attn_layers.2/Constant_3_output_0": "c000448", + "onnx::Unsqueeze_2221": "c000449", + "/text_encoder/attn_encoder/attn_layers.2/Constant_4_output_0": "c000450", + "/text_encoder/attn_encoder/attn_layers.2/Constant_5_output_0": "c000451", + "onnx::Unsqueeze_2227": "c000452", + "onnx::Unsqueeze_2232": "c000453", + "/text_encoder/attn_encoder/attn_layers.2/Constant_6_output_0": "c000454", + "/text_encoder/attn_encoder/attn_layers.2/Constant_7_output_0": "c000455", + "onnx::Unsqueeze_2238": "c000456", + "onnx::Unsqueeze_2241": "c000457", + "/text_encoder/attn_encoder/attn_layers.2/Constant_8_output_0": "c000458", + "/text_encoder/attn_encoder/attn_layers.2/Constant_9_output_0": "c000459", + "onnx::Unsqueeze_2247": "c000460", + "/text_encoder/attn_encoder/attn_layers.2/Constant_10_output_0": "c000461", + "/text_encoder/attn_encoder/attn_layers.2/Constant_11_output_0": "c000462", + "/text_encoder/attn_encoder/attn_layers.2/Constant_12_output_0": "c000463", + "/text_encoder/attn_encoder/attn_layers.2/Constant_13_output_0": "c000464", + "/text_encoder/attn_encoder/attn_layers.2/Constant_14_output_0": "c000465", + "/text_encoder/attn_encoder/attn_layers.2/Constant_15_output_0": "c000466", + "/text_encoder/attn_encoder/attn_layers.2/Constant_16_output_0": "c000467", + "/text_encoder/attn_encoder/attn_layers.2/Constant_17_output_0": "c000468", + "/text_encoder/attn_encoder/attn_layers.2/Constant_18_output_0": "c000469", + "onnx::Unsqueeze_2277": "c000470", + "onnx::Unsqueeze_2279": "c000471", + "/text_encoder/attn_encoder/attn_layers.2/Constant_19_output_0": "c000472", + "/text_encoder/attn_encoder/attn_layers.2/Constant_20_output_0": "c000473", + "/text_encoder/attn_encoder/attn_layers.2/Constant_21_output_0": "c000474", + "/text_encoder/attn_encoder/attn_layers.2/Constant_22_output_0": "c000475", + "onnx::Unsqueeze_2290": "c000476", + "onnx::Unsqueeze_2292": "c000477", + "/text_encoder/attn_encoder/attn_layers.2/Constant_23_output_0": "c000478", + "/text_encoder/attn_encoder/attn_layers.2/Constant_24_output_0": "c000479", + "/text_encoder/attn_encoder/attn_layers.2/Constant_25_output_0": "c000480", + "/text_encoder/attn_encoder/attn_layers.2/Constant_26_output_0": "c000481", + "onnx::Unsqueeze_2303": "c000482", + "onnx::Unsqueeze_2305": "c000483", + "/text_encoder/attn_encoder/attn_layers.2/Constant_27_output_0": "c000484", + "/text_encoder/attn_encoder/attn_layers.2/Constant_28_output_0": "c000485", + "/text_encoder/attn_encoder/attn_layers.2/Constant_29_output_0": "c000486", + "/text_encoder/attn_encoder/attn_layers.2/Constant_30_output_0": "c000487", + "onnx::Unsqueeze_2316": "c000488", + "onnx::Unsqueeze_2318": "c000489", + "/text_encoder/attn_encoder/attn_layers.2/Constant_31_output_0": "c000490", + "/text_encoder/attn_encoder/attn_layers.2/Constant_32_output_0": "c000491", + "/text_encoder/attn_encoder/attn_layers.2/Constant_33_output_0": "c000492", + "/text_encoder/attn_encoder/attn_layers.2/Constant_34_output_0": "c000493", + "/text_encoder/attn_encoder/attn_layers.2/Constant_35_output_0": "c000494", + "/text_encoder/attn_encoder/attn_layers.2/Constant_36_output_0": "c000495", + "/text_encoder/attn_encoder/attn_layers.2/Constant_37_output_0": "c000496", + "/text_encoder/attn_encoder/attn_layers.2/Constant_38_output_0": "c000497", + "/text_encoder/attn_encoder/attn_layers.2/Constant_39_output_0": "c000498", + "/text_encoder/attn_encoder/attn_layers.2/Constant_40_output_0": "c000499", + "/text_encoder/attn_encoder/attn_layers.2/Constant_41_output_0": "c000500", + "/text_encoder/attn_encoder/attn_layers.2/Constant_42_output_0": "c000501", + "/text_encoder/attn_encoder/attn_layers.2/Constant_43_output_0": "c000502", + "/text_encoder/attn_encoder/attn_layers.2/Constant_44_output_0": "c000503", + "/text_encoder/attn_encoder/attn_layers.2/Constant_45_output_0": "c000504", + "/text_encoder/attn_encoder/attn_layers.2/Constant_46_output_0": "c000505", + "/text_encoder/attn_encoder/attn_layers.2/Constant_47_output_0": "c000506", + "/text_encoder/attn_encoder/attn_layers.2/Constant_48_output_0": "c000507", + "/text_encoder/attn_encoder/attn_layers.2/Constant_49_output_0": "c000508", + "/text_encoder/attn_encoder/attn_layers.2/Constant_50_output_0": "c000509", + "/text_encoder/attn_encoder/attn_layers.2/Constant_51_output_0": "c000510", + "/text_encoder/attn_encoder/attn_layers.2/Constant_52_output_0": "c000511", + "/text_encoder/attn_encoder/attn_layers.2/Constant_53_output_0": "c000512", + "/text_encoder/attn_encoder/attn_layers.2/Constant_54_output_0": "c000513", + "/text_encoder/attn_encoder/attn_layers.2/Constant_55_output_0": "c000514", + "/text_encoder/attn_encoder/attn_layers.2/Constant_56_output_0": "c000515", + "/text_encoder/attn_encoder/attn_layers.2/Constant_57_output_0": "c000516", + "onnx::Unsqueeze_2394": "c000517", + "onnx::Unsqueeze_2396": "c000518", + "onnx::Unsqueeze_2398": "c000519", + "/text_encoder/attn_encoder/attn_layers.2/Constant_58_output_0": "c000520", + "/text_encoder/attn_encoder/attn_layers.2/Constant_59_output_0": "c000521", + "onnx::Unsqueeze_2406": "c000522", + "/text_encoder/attn_encoder/attn_layers.2/Constant_60_output_0": "c000523", + "/text_encoder/attn_encoder/attn_layers.2/Constant_61_output_0": "c000524", + "/text_encoder/attn_encoder/attn_layers.2/Constant_62_output_0": "c000525", + "/text_encoder/attn_encoder/attn_layers.2/Constant_63_output_0": "c000526", + "/text_encoder/attn_encoder/attn_layers.2/Constant_64_output_0": "c000527", + "onnx::Unsqueeze_2419": "c000528", + "/text_encoder/attn_encoder/attn_layers.2/Constant_65_output_0": "c000529", + "/text_encoder/attn_encoder/attn_layers.2/Constant_66_output_0": "c000530", + "/text_encoder/attn_encoder/attn_layers.2/Constant_67_output_0": "c000531", + "/text_encoder/attn_encoder/attn_layers.2/Constant_68_output_0": "c000532", + "/text_encoder/attn_encoder/attn_layers.2/Constant_69_output_0": "c000533", + "/text_encoder/attn_encoder/attn_layers.2/Constant_70_output_0": "c000534", + "/text_encoder/attn_encoder/attn_layers.2/Constant_71_output_0": "c000535", + "/text_encoder/attn_encoder/attn_layers.2/Constant_72_output_0": "c000536", + "/text_encoder/attn_encoder/attn_layers.2/Constant_73_output_0": "c000537", + "/text_encoder/attn_encoder/attn_layers.2/Constant_74_output_0": "c000538", + "/text_encoder/attn_encoder/attn_layers.2/Constant_75_output_0": "c000539", + "/text_encoder/attn_encoder/attn_layers.2/Constant_76_output_0": "c000540", + "/text_encoder/attn_encoder/attn_layers.2/Constant_77_output_0": "c000541", + "/text_encoder/attn_encoder/attn_layers.2/Constant_78_output_0": "c000542", + "onnx::Unsqueeze_2456": "c000543", + "onnx::Unsqueeze_2458": "c000544", + "onnx::Unsqueeze_2460": "c000545", + "onnx::Unsqueeze_2462": "c000546", + "/text_encoder/attn_encoder/attn_layers.2/Constant_79_output_0": "c000547", + "/text_encoder/attn_encoder/attn_layers.2/Constant_80_output_0": "c000548", + "/text_encoder/attn_encoder/attn_layers.2/Constant_81_output_0": "c000549", + "/text_encoder/attn_encoder/attn_layers.2/Constant_82_output_0": "c000550", + "/text_encoder/attn_encoder/attn_layers.2/Constant_83_output_0": "c000551", + "/text_encoder/attn_encoder/attn_layers.2/Constant_84_output_0": "c000552", + "/text_encoder/attn_encoder/attn_layers.2/Constant_85_output_0": "c000553", + "/text_encoder/attn_encoder/attn_layers.2/Constant_86_output_0": "c000554", + "/text_encoder/attn_encoder/attn_layers.2/Constant_87_output_0": "c000555", + "/text_encoder/attn_encoder/attn_layers.2/Constant_88_output_0": "c000556", + "/text_encoder/attn_encoder/attn_layers.2/Constant_89_output_0": "c000557", + "/text_encoder/attn_encoder/attn_layers.2/Constant_90_output_0": "c000558", + "/text_encoder/attn_encoder/attn_layers.2/Constant_91_output_0": "c000559", + "/text_encoder/attn_encoder/attn_layers.2/Constant_92_output_0": "c000560", + "onnx::Unsqueeze_2503": "c000561", + "/text_encoder/attn_encoder/attn_layers.2/Constant_93_output_0": "c000562", + "/text_encoder/attn_encoder/attn_layers.2/Constant_94_output_0": "c000563", + "/text_encoder/attn_encoder/attn_layers.2/Constant_95_output_0": "c000564", + "/text_encoder/attn_encoder/attn_layers.2/Constant_96_output_0": "c000565", + "/text_encoder/attn_encoder/attn_layers.2/Constant_97_output_0": "c000566", + "/text_encoder/attn_encoder/attn_layers.2/Constant_98_output_0": "c000567", + "/text_encoder/attn_encoder/attn_layers.2/Constant_99_output_0": "c000568", + "onnx::Unsqueeze_2520": "c000569", + "/text_encoder/attn_encoder/attn_layers.2/Constant_100_output_0": "c000570", + "/text_encoder/attn_encoder/attn_layers.2/Constant_101_output_0": "c000571", + "/text_encoder/attn_encoder/attn_layers.2/Constant_102_output_0": "c000572", + "/text_encoder/attn_encoder/attn_layers.2/Constant_103_output_0": "c000573", + "/text_encoder/attn_encoder/attn_layers.2/Constant_104_output_0": "c000574", + "/text_encoder/attn_encoder/attn_layers.2/Constant_105_output_0": "c000575", + "/text_encoder/attn_encoder/attn_layers.2/Constant_106_output_0": "c000576", + "/text_encoder/attn_encoder/attn_layers.2/Constant_107_output_0": "c000577", + "/text_encoder/attn_encoder/attn_layers.2/Constant_108_output_0": "c000578", + "/text_encoder/attn_encoder/attn_layers.2/Constant_109_output_0": "c000579", + "/text_encoder/attn_encoder/attn_layers.2/Constant_110_output_0": "c000580", + "/text_encoder/attn_encoder/attn_layers.2/Constant_111_output_0": "c000581", + "/text_encoder/attn_encoder/attn_layers.2/Constant_112_output_0": "c000582", + "/text_encoder/attn_encoder/attn_layers.2/Constant_113_output_0": "c000583", + "/text_encoder/attn_encoder/attn_layers.2/Constant_114_output_0": "c000584", + "onnx::Unsqueeze_2561": "c000585", + "onnx::Unsqueeze_2563": "c000586", + "onnx::Unsqueeze_2565": "c000587", + "onnx::Unsqueeze_2569": "c000588", + "/text_encoder/attn_encoder/attn_layers.2/Constant_115_output_0": "c000589", + "/text_encoder/attn_encoder/attn_layers.2/Constant_116_output_0": "c000590", + "/text_encoder/attn_encoder/attn_layers.2/Constant_117_output_0": "c000591", + "/text_encoder/attn_encoder/attn_layers.2/Constant_118_output_0": "c000592", + "/text_encoder/attn_encoder/attn_layers.2/Constant_119_output_0": "c000593", + "onnx::Unsqueeze_2582": "c000594", + "/text_encoder/attn_encoder/attn_layers.2/Constant_120_output_0": "c000595", + "/text_encoder/attn_encoder/attn_layers.2/Constant_121_output_0": "c000596", + "/text_encoder/attn_encoder/attn_layers.2/Constant_122_output_0": "c000597", + "/text_encoder/attn_encoder/attn_layers.2/Constant_123_output_0": "c000598", + "/text_encoder/attn_encoder/attn_layers.2/Constant_124_output_0": "c000599", + "/text_encoder/attn_encoder/attn_layers.2/Constant_125_output_0": "c000600", + "/text_encoder/attn_encoder/attn_layers.2/Constant_126_output_0": "c000601", + "/text_encoder/attn_encoder/attn_layers.2/Constant_127_output_0": "c000602", + "/text_encoder/attn_encoder/attn_layers.2/Constant_128_output_0": "c000603", + "/text_encoder/attn_encoder/attn_layers.2/Constant_129_output_0": "c000604", + "/text_encoder/attn_encoder/attn_layers.2/Constant_130_output_0": "c000605", + "/text_encoder/attn_encoder/attn_layers.2/Constant_131_output_0": "c000606", + "/text_encoder/attn_encoder/attn_layers.2/Constant_132_output_0": "c000607", + "/text_encoder/attn_encoder/attn_layers.2/Constant_133_output_0": "c000608", + "onnx::Unsqueeze_2619": "c000609", + "onnx::Unsqueeze_2621": "c000610", + "onnx::Unsqueeze_2623": "c000611", + "onnx::Unsqueeze_2625": "c000612", + "/text_encoder/attn_encoder/attn_layers.2/Constant_134_output_0": "c000613", + "/text_encoder/attn_encoder/attn_layers.2/Constant_135_output_0": "c000614", + "/text_encoder/attn_encoder/attn_layers.2/Constant_136_output_0": "c000615", + "/text_encoder/attn_encoder/attn_layers.2/Constant_137_output_0": "c000616", + "/text_encoder/attn_encoder/attn_layers.2/Constant_138_output_0": "c000617", + "/text_encoder/attn_encoder/attn_layers.2/Constant_139_output_0": "c000618", + "/text_encoder/attn_encoder/attn_layers.2/Constant_140_output_0": "c000619", + "/text_encoder/attn_encoder/attn_layers.2/Constant_141_output_0": "c000620", + "/text_encoder/attn_encoder/attn_layers.2/Constant_142_output_0": "c000621", + "/text_encoder/attn_encoder/attn_layers.2/Constant_143_output_0": "c000622", + "/text_encoder/attn_encoder/attn_layers.2/Constant_144_output_0": "c000623", + "/text_encoder/attn_encoder/attn_layers.2/Constant_145_output_0": "c000624", + "/text_encoder/attn_encoder/attn_layers.2/Constant_146_output_0": "c000625", + "/text_encoder/attn_encoder/attn_layers.2/Constant_147_output_0": "c000626", + "/text_encoder/attn_encoder/attn_layers.2/Constant_148_output_0": "c000627", + "/text_encoder/attn_encoder/attn_layers.2/Constant_149_output_0": "c000628", + "/text_encoder/attn_encoder/attn_layers.2/Constant_150_output_0": "c000629", + "onnx::Unsqueeze_2674": "c000630", + "onnx::Unsqueeze_2676": "c000631", + "onnx::Unsqueeze_2678": "c000632", + "/text_encoder/attn_encoder/attn_layers.3/Constant_output_0": "c000633", + "/text_encoder/attn_encoder/attn_layers.3/Constant_1_output_0": "c000634", + "/text_encoder/attn_encoder/attn_layers.3/Constant_2_output_0": "c000635", + "/text_encoder/attn_encoder/attn_layers.3/Constant_3_output_0": "c000636", + "onnx::Unsqueeze_2712": "c000637", + "/text_encoder/attn_encoder/attn_layers.3/Constant_4_output_0": "c000638", + "/text_encoder/attn_encoder/attn_layers.3/Constant_5_output_0": "c000639", + "onnx::Unsqueeze_2718": "c000640", + "onnx::Unsqueeze_2723": "c000641", + "/text_encoder/attn_encoder/attn_layers.3/Constant_6_output_0": "c000642", + "/text_encoder/attn_encoder/attn_layers.3/Constant_7_output_0": "c000643", + "onnx::Unsqueeze_2729": "c000644", + "onnx::Unsqueeze_2732": "c000645", + "/text_encoder/attn_encoder/attn_layers.3/Constant_8_output_0": "c000646", + "/text_encoder/attn_encoder/attn_layers.3/Constant_9_output_0": "c000647", + "onnx::Unsqueeze_2738": "c000648", + "/text_encoder/attn_encoder/attn_layers.3/Constant_10_output_0": "c000649", + "/text_encoder/attn_encoder/attn_layers.3/Constant_11_output_0": "c000650", + "/text_encoder/attn_encoder/attn_layers.3/Constant_12_output_0": "c000651", + "/text_encoder/attn_encoder/attn_layers.3/Constant_13_output_0": "c000652", + "/text_encoder/attn_encoder/attn_layers.3/Constant_14_output_0": "c000653", + "/text_encoder/attn_encoder/attn_layers.3/Constant_15_output_0": "c000654", + "/text_encoder/attn_encoder/attn_layers.3/Constant_16_output_0": "c000655", + "/text_encoder/attn_encoder/attn_layers.3/Constant_17_output_0": "c000656", + "/text_encoder/attn_encoder/attn_layers.3/Constant_18_output_0": "c000657", + "onnx::Unsqueeze_2768": "c000658", + "onnx::Unsqueeze_2770": "c000659", + "/text_encoder/attn_encoder/attn_layers.3/Constant_19_output_0": "c000660", + "/text_encoder/attn_encoder/attn_layers.3/Constant_20_output_0": "c000661", + "/text_encoder/attn_encoder/attn_layers.3/Constant_21_output_0": "c000662", + "/text_encoder/attn_encoder/attn_layers.3/Constant_22_output_0": "c000663", + "onnx::Unsqueeze_2781": "c000664", + "onnx::Unsqueeze_2783": "c000665", + "/text_encoder/attn_encoder/attn_layers.3/Constant_23_output_0": "c000666", + "/text_encoder/attn_encoder/attn_layers.3/Constant_24_output_0": "c000667", + "/text_encoder/attn_encoder/attn_layers.3/Constant_25_output_0": "c000668", + "/text_encoder/attn_encoder/attn_layers.3/Constant_26_output_0": "c000669", + "onnx::Unsqueeze_2794": "c000670", + "onnx::Unsqueeze_2796": "c000671", + "/text_encoder/attn_encoder/attn_layers.3/Constant_27_output_0": "c000672", + "/text_encoder/attn_encoder/attn_layers.3/Constant_28_output_0": "c000673", + "/text_encoder/attn_encoder/attn_layers.3/Constant_29_output_0": "c000674", + "/text_encoder/attn_encoder/attn_layers.3/Constant_30_output_0": "c000675", + "onnx::Unsqueeze_2807": "c000676", + "onnx::Unsqueeze_2809": "c000677", + "/text_encoder/attn_encoder/attn_layers.3/Constant_31_output_0": "c000678", + "/text_encoder/attn_encoder/attn_layers.3/Constant_32_output_0": "c000679", + "/text_encoder/attn_encoder/attn_layers.3/Constant_33_output_0": "c000680", + "/text_encoder/attn_encoder/attn_layers.3/Constant_34_output_0": "c000681", + "/text_encoder/attn_encoder/attn_layers.3/Constant_35_output_0": "c000682", + "/text_encoder/attn_encoder/attn_layers.3/Constant_36_output_0": "c000683", + "/text_encoder/attn_encoder/attn_layers.3/Constant_37_output_0": "c000684", + "/text_encoder/attn_encoder/attn_layers.3/Constant_38_output_0": "c000685", + "/text_encoder/attn_encoder/attn_layers.3/Constant_39_output_0": "c000686", + "/text_encoder/attn_encoder/attn_layers.3/Constant_40_output_0": "c000687", + "/text_encoder/attn_encoder/attn_layers.3/Constant_41_output_0": "c000688", + "/text_encoder/attn_encoder/attn_layers.3/Constant_42_output_0": "c000689", + "/text_encoder/attn_encoder/attn_layers.3/Constant_43_output_0": "c000690", + "/text_encoder/attn_encoder/attn_layers.3/Constant_44_output_0": "c000691", + "/text_encoder/attn_encoder/attn_layers.3/Constant_45_output_0": "c000692", + "/text_encoder/attn_encoder/attn_layers.3/Constant_46_output_0": "c000693", + "/text_encoder/attn_encoder/attn_layers.3/Constant_47_output_0": "c000694", + "/text_encoder/attn_encoder/attn_layers.3/Constant_48_output_0": "c000695", + "/text_encoder/attn_encoder/attn_layers.3/Constant_49_output_0": "c000696", + "/text_encoder/attn_encoder/attn_layers.3/Constant_50_output_0": "c000697", + "/text_encoder/attn_encoder/attn_layers.3/Constant_51_output_0": "c000698", + "/text_encoder/attn_encoder/attn_layers.3/Constant_52_output_0": "c000699", + "/text_encoder/attn_encoder/attn_layers.3/Constant_53_output_0": "c000700", + "/text_encoder/attn_encoder/attn_layers.3/Constant_54_output_0": "c000701", + "/text_encoder/attn_encoder/attn_layers.3/Constant_55_output_0": "c000702", + "/text_encoder/attn_encoder/attn_layers.3/Constant_56_output_0": "c000703", + "/text_encoder/attn_encoder/attn_layers.3/Constant_57_output_0": "c000704", + "onnx::Unsqueeze_2885": "c000705", + "onnx::Unsqueeze_2887": "c000706", + "onnx::Unsqueeze_2889": "c000707", + "/text_encoder/attn_encoder/attn_layers.3/Constant_58_output_0": "c000708", + "/text_encoder/attn_encoder/attn_layers.3/Constant_59_output_0": "c000709", + "onnx::Unsqueeze_2897": "c000710", + "/text_encoder/attn_encoder/attn_layers.3/Constant_60_output_0": "c000711", + "/text_encoder/attn_encoder/attn_layers.3/Constant_61_output_0": "c000712", + "/text_encoder/attn_encoder/attn_layers.3/Constant_62_output_0": "c000713", + "/text_encoder/attn_encoder/attn_layers.3/Constant_63_output_0": "c000714", + "/text_encoder/attn_encoder/attn_layers.3/Constant_64_output_0": "c000715", + "onnx::Unsqueeze_2910": "c000716", + "/text_encoder/attn_encoder/attn_layers.3/Constant_65_output_0": "c000717", + "/text_encoder/attn_encoder/attn_layers.3/Constant_66_output_0": "c000718", + "/text_encoder/attn_encoder/attn_layers.3/Constant_67_output_0": "c000719", + "/text_encoder/attn_encoder/attn_layers.3/Constant_68_output_0": "c000720", + "/text_encoder/attn_encoder/attn_layers.3/Constant_69_output_0": "c000721", + "/text_encoder/attn_encoder/attn_layers.3/Constant_70_output_0": "c000722", + "/text_encoder/attn_encoder/attn_layers.3/Constant_71_output_0": "c000723", + "/text_encoder/attn_encoder/attn_layers.3/Constant_72_output_0": "c000724", + "/text_encoder/attn_encoder/attn_layers.3/Constant_73_output_0": "c000725", + "/text_encoder/attn_encoder/attn_layers.3/Constant_74_output_0": "c000726", + "/text_encoder/attn_encoder/attn_layers.3/Constant_75_output_0": "c000727", + "/text_encoder/attn_encoder/attn_layers.3/Constant_76_output_0": "c000728", + "/text_encoder/attn_encoder/attn_layers.3/Constant_77_output_0": "c000729", + "/text_encoder/attn_encoder/attn_layers.3/Constant_78_output_0": "c000730", + "onnx::Unsqueeze_2947": "c000731", + "onnx::Unsqueeze_2949": "c000732", + "onnx::Unsqueeze_2951": "c000733", + "onnx::Unsqueeze_2953": "c000734", + "/text_encoder/attn_encoder/attn_layers.3/Constant_79_output_0": "c000735", + "/text_encoder/attn_encoder/attn_layers.3/Constant_80_output_0": "c000736", + "/text_encoder/attn_encoder/attn_layers.3/Constant_81_output_0": "c000737", + "/text_encoder/attn_encoder/attn_layers.3/Constant_82_output_0": "c000738", + "/text_encoder/attn_encoder/attn_layers.3/Constant_83_output_0": "c000739", + "/text_encoder/attn_encoder/attn_layers.3/Constant_84_output_0": "c000740", + "/text_encoder/attn_encoder/attn_layers.3/Constant_85_output_0": "c000741", + "/text_encoder/attn_encoder/attn_layers.3/Constant_86_output_0": "c000742", + "/text_encoder/attn_encoder/attn_layers.3/Constant_87_output_0": "c000743", + "/text_encoder/attn_encoder/attn_layers.3/Constant_88_output_0": "c000744", + "/text_encoder/attn_encoder/attn_layers.3/Constant_89_output_0": "c000745", + "/text_encoder/attn_encoder/attn_layers.3/Constant_90_output_0": "c000746", + "/text_encoder/attn_encoder/attn_layers.3/Constant_91_output_0": "c000747", + "/text_encoder/attn_encoder/attn_layers.3/Constant_92_output_0": "c000748", + "onnx::Unsqueeze_2994": "c000749", + "/text_encoder/attn_encoder/attn_layers.3/Constant_93_output_0": "c000750", + "/text_encoder/attn_encoder/attn_layers.3/Constant_94_output_0": "c000751", + "/text_encoder/attn_encoder/attn_layers.3/Constant_95_output_0": "c000752", + "/text_encoder/attn_encoder/attn_layers.3/Constant_96_output_0": "c000753", + "/text_encoder/attn_encoder/attn_layers.3/Constant_97_output_0": "c000754", + "/text_encoder/attn_encoder/attn_layers.3/Constant_98_output_0": "c000755", + "/text_encoder/attn_encoder/attn_layers.3/Constant_99_output_0": "c000756", + "onnx::Unsqueeze_3011": "c000757", + "/text_encoder/attn_encoder/attn_layers.3/Constant_100_output_0": "c000758", + "/text_encoder/attn_encoder/attn_layers.3/Constant_101_output_0": "c000759", + "/text_encoder/attn_encoder/attn_layers.3/Constant_102_output_0": "c000760", + "/text_encoder/attn_encoder/attn_layers.3/Constant_103_output_0": "c000761", + "/text_encoder/attn_encoder/attn_layers.3/Constant_104_output_0": "c000762", + "/text_encoder/attn_encoder/attn_layers.3/Constant_105_output_0": "c000763", + "/text_encoder/attn_encoder/attn_layers.3/Constant_106_output_0": "c000764", + "/text_encoder/attn_encoder/attn_layers.3/Constant_107_output_0": "c000765", + "/text_encoder/attn_encoder/attn_layers.3/Constant_108_output_0": "c000766", + "/text_encoder/attn_encoder/attn_layers.3/Constant_109_output_0": "c000767", + "/text_encoder/attn_encoder/attn_layers.3/Constant_110_output_0": "c000768", + "/text_encoder/attn_encoder/attn_layers.3/Constant_111_output_0": "c000769", + "/text_encoder/attn_encoder/attn_layers.3/Constant_112_output_0": "c000770", + "/text_encoder/attn_encoder/attn_layers.3/Constant_113_output_0": "c000771", + "/text_encoder/attn_encoder/attn_layers.3/Constant_114_output_0": "c000772", + "onnx::Unsqueeze_3052": "c000773", + "onnx::Unsqueeze_3054": "c000774", + "onnx::Unsqueeze_3056": "c000775", + "onnx::Unsqueeze_3060": "c000776", + "/text_encoder/attn_encoder/attn_layers.3/Constant_115_output_0": "c000777", + "/text_encoder/attn_encoder/attn_layers.3/Constant_116_output_0": "c000778", + "/text_encoder/attn_encoder/attn_layers.3/Constant_117_output_0": "c000779", + "/text_encoder/attn_encoder/attn_layers.3/Constant_118_output_0": "c000780", + "/text_encoder/attn_encoder/attn_layers.3/Constant_119_output_0": "c000781", + "onnx::Unsqueeze_3073": "c000782", + "/text_encoder/attn_encoder/attn_layers.3/Constant_120_output_0": "c000783", + "/text_encoder/attn_encoder/attn_layers.3/Constant_121_output_0": "c000784", + "/text_encoder/attn_encoder/attn_layers.3/Constant_122_output_0": "c000785", + "/text_encoder/attn_encoder/attn_layers.3/Constant_123_output_0": "c000786", + "/text_encoder/attn_encoder/attn_layers.3/Constant_124_output_0": "c000787", + "/text_encoder/attn_encoder/attn_layers.3/Constant_125_output_0": "c000788", + "/text_encoder/attn_encoder/attn_layers.3/Constant_126_output_0": "c000789", + "/text_encoder/attn_encoder/attn_layers.3/Constant_127_output_0": "c000790", + "/text_encoder/attn_encoder/attn_layers.3/Constant_128_output_0": "c000791", + "/text_encoder/attn_encoder/attn_layers.3/Constant_129_output_0": "c000792", + "/text_encoder/attn_encoder/attn_layers.3/Constant_130_output_0": "c000793", + "/text_encoder/attn_encoder/attn_layers.3/Constant_131_output_0": "c000794", + "/text_encoder/attn_encoder/attn_layers.3/Constant_132_output_0": "c000795", + "/text_encoder/attn_encoder/attn_layers.3/Constant_133_output_0": "c000796", + "onnx::Unsqueeze_3110": "c000797", + "onnx::Unsqueeze_3112": "c000798", + "onnx::Unsqueeze_3114": "c000799", + "onnx::Unsqueeze_3116": "c000800", + "/text_encoder/attn_encoder/attn_layers.3/Constant_134_output_0": "c000801", + "/text_encoder/attn_encoder/attn_layers.3/Constant_135_output_0": "c000802", + "/text_encoder/attn_encoder/attn_layers.3/Constant_136_output_0": "c000803", + "/text_encoder/attn_encoder/attn_layers.3/Constant_137_output_0": "c000804", + "/text_encoder/attn_encoder/attn_layers.3/Constant_138_output_0": "c000805", + "/text_encoder/attn_encoder/attn_layers.3/Constant_139_output_0": "c000806", + "/text_encoder/attn_encoder/attn_layers.3/Constant_140_output_0": "c000807", + "/text_encoder/attn_encoder/attn_layers.3/Constant_141_output_0": "c000808", + "/text_encoder/attn_encoder/attn_layers.3/Constant_142_output_0": "c000809", + "/text_encoder/attn_encoder/attn_layers.3/Constant_143_output_0": "c000810", + "/text_encoder/attn_encoder/attn_layers.3/Constant_144_output_0": "c000811", + "/text_encoder/attn_encoder/attn_layers.3/Constant_145_output_0": "c000812", + "/text_encoder/attn_encoder/attn_layers.3/Constant_146_output_0": "c000813", + "/text_encoder/attn_encoder/attn_layers.3/Constant_147_output_0": "c000814", + "/text_encoder/attn_encoder/attn_layers.3/Constant_148_output_0": "c000815", + "/text_encoder/attn_encoder/attn_layers.3/Constant_149_output_0": "c000816", + "/text_encoder/attn_encoder/attn_layers.3/Constant_150_output_0": "c000817", + "onnx::Unsqueeze_3165": "c000818", + "onnx::Unsqueeze_3167": "c000819", + "onnx::Unsqueeze_3169": "c000820", + "onnx::Tile_3191": "c000821", + "/Constant_output_0": "c000822", + "/speech_prompted_text_encoder/attention1/Constant_output_0": "c000823", + "/speech_prompted_text_encoder/attention1/Constant_1_output_0": "c000824", + "/speech_prompted_text_encoder/attention1/Constant_2_output_0": "c000825", + "/speech_prompted_text_encoder/attention1/Constant_3_output_0": "c000826", + "/speech_prompted_text_encoder/attention1/Constant_4_output_0": "c000827", + "/speech_prompted_text_encoder/attention1/Constant_5_output_0": "c000828", + "/speech_prompted_text_encoder/attention1/Constant_6_output_0": "c000829", + "/speech_prompted_text_encoder/attention1/Constant_7_output_0": "c000830", + "/speech_prompted_text_encoder/attention1/Constant_8_output_0": "c000831", + "/speech_prompted_text_encoder/attention1/Constant_9_output_0": "c000832", + "/speech_prompted_text_encoder/attention1/Constant_10_output_0": "c000833", + "/speech_prompted_text_encoder/attention1/Constant_11_output_0": "c000834", + "/speech_prompted_text_encoder/attention1/Constant_12_output_0": "c000835", + "/speech_prompted_text_encoder/attention1/Constant_13_output_0": "c000836", + "/speech_prompted_text_encoder/attention1/Constant_14_output_0": "c000837", + "/speech_prompted_text_encoder/attention2/Constant_output_0": "c000838", + "/speech_prompted_text_encoder/attention2/Constant_1_output_0": "c000839", + "/speech_prompted_text_encoder/attention2/Constant_2_output_0": "c000840", + "/speech_prompted_text_encoder/attention2/Constant_3_output_0": "c000841", + "/speech_prompted_text_encoder/attention2/Constant_4_output_0": "c000842", + "/speech_prompted_text_encoder/attention2/Constant_5_output_0": "c000843", + "/speech_prompted_text_encoder/attention2/Constant_6_output_0": "c000844", + "/speech_prompted_text_encoder/attention2/Constant_7_output_0": "c000845", + "/speech_prompted_text_encoder/attention2/Constant_8_output_0": "c000846", + "/speech_prompted_text_encoder/attention2/Constant_9_output_0": "c000847", + "/speech_prompted_text_encoder/attention2/Constant_10_output_0": "c000848", + "/speech_prompted_text_encoder/attention2/Constant_11_output_0": "c000849", + "/speech_prompted_text_encoder/attention2/Constant_12_output_0": "c000850" + }, + "nodes": [ + { + "op_type": "Gather", + "name": "/text_encoder/text_embedder/char_embedder/Gather", + "inputs": [ + "tts.ttl.text_encoder.text_embedder.char_embedder.weight", + "text_ids" + ], + "outputs": [ + "/text_encoder/text_embedder/char_embedder/Gather_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/text_embedder/Transpose", + "inputs": [ + "/text_encoder/text_embedder/char_embedder/Gather_output_0" + ], + "outputs": [ + "/text_encoder/text_embedder/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/text_embedder/Mul", + "inputs": [ + "/text_encoder/text_embedder/Transpose_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/text_embedder/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.0/Mul", + "inputs": [ + "/text_encoder/text_embedder/Mul_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/convnext/convnext.0/dwconv/ConstantOfShape", + "inputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/dwconv/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/convnext/convnext.0/dwconv/Concat", + "inputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Constant_1_output_0", + "/text_encoder/convnext/convnext.0/dwconv/ConstantOfShape_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.0/dwconv/Reshape", + "inputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Concat_output_0", + "/text_encoder/convnext/convnext.0/dwconv/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Reshape_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/convnext/convnext.0/dwconv/Slice", + "inputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Reshape_output_0", + "/text_encoder/convnext/convnext.0/dwconv/Constant_4_output_0", + "/text_encoder/convnext/convnext.0/dwconv/Constant_5_output_0", + "/text_encoder/convnext/convnext.0/dwconv/Constant_3_output_0", + "/text_encoder/convnext/convnext.0/dwconv/Constant_6_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Slice_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.0/dwconv/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Slice_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Transpose_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.0/dwconv/Reshape_1", + "inputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Transpose_output_0", + "/text_encoder/convnext/convnext.0/dwconv/Constant_7_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Reshape_1_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/convnext/convnext.0/dwconv/Cast", + "inputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Reshape_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Cast_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/convnext/convnext.0/dwconv/Pad", + "inputs": [ + "/text_encoder/convnext/convnext.0/Mul_output_0", + "/text_encoder/convnext/convnext.0/dwconv/Cast_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Pad_output_0" + ], + "attrs": { + "mode": "edge" + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.0/dwconv/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Pad_output_0", + "tts.ttl.text_encoder.convnext.convnext.0.dwconv.weight", + "tts.ttl.text_encoder.convnext.convnext.0.dwconv.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 256, + "kernel_shape": [ + 5 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.0/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.0/dwconv/Conv_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.0/norm/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.0/Mul_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/norm/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/convnext/convnext.0/norm/norm/LayerNormalization", + "inputs": [ + "/text_encoder/convnext/convnext.0/norm/Transpose_output_0", + "tts.ttl.text_encoder.convnext.convnext.0.norm.norm.weight", + "tts.ttl.text_encoder.convnext.convnext.0.norm.norm.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/norm/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.0/norm/Transpose_1", + "inputs": [ + "/text_encoder/convnext/convnext.0/norm/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/norm/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.0/pwconv1/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.0/norm/Transpose_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.0.pwconv1.weight", + "tts.ttl.text_encoder.convnext.convnext.0.pwconv1.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/pwconv1/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Div", + "name": "/text_encoder/convnext/convnext.0/act/Div", + "inputs": [ + "/text_encoder/convnext/convnext.0/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.0/act/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/act/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "Erf", + "name": "/text_encoder/convnext/convnext.0/act/Erf", + "inputs": [ + "/text_encoder/convnext/convnext.0/act/Div_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/act/Erf_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.0/act/Add", + "inputs": [ + "/text_encoder/convnext/convnext.0/act/Erf_output_0", + "/text_encoder/convnext/convnext.0/act/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/act/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.0/act/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.0/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.0/act/Add_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/act/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.0/act/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.0/act/Mul_output_0", + "/text_encoder/convnext/convnext.0/act/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/act/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.0/pwconv2/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.0/act/Mul_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.0.pwconv2.weight", + "tts.ttl.text_encoder.convnext.convnext.0.pwconv2.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/pwconv2/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.0/Mul_2", + "inputs": [ + "tts.ttl.text_encoder.convnext.convnext.0.gamma", + "/text_encoder/convnext/convnext.0/pwconv2/Conv_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.0/Add", + "inputs": [ + "/text_encoder/convnext/convnext.0/Mul_output_0", + "/text_encoder/convnext/convnext.0/Mul_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.0/Mul_3", + "inputs": [ + "/text_encoder/convnext/convnext.0/Add_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.0/Mul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.1/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.0/Mul_3_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/convnext/convnext.1/dwconv/ConstantOfShape", + "inputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/dwconv/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/convnext/convnext.1/dwconv/Concat", + "inputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Constant_1_output_0", + "/text_encoder/convnext/convnext.1/dwconv/ConstantOfShape_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.1/dwconv/Reshape", + "inputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Concat_output_0", + "/text_encoder/convnext/convnext.1/dwconv/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Reshape_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/convnext/convnext.1/dwconv/Slice", + "inputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Reshape_output_0", + "/text_encoder/convnext/convnext.1/dwconv/Constant_4_output_0", + "/text_encoder/convnext/convnext.1/dwconv/Constant_5_output_0", + "/text_encoder/convnext/convnext.1/dwconv/Constant_3_output_0", + "/text_encoder/convnext/convnext.1/dwconv/Constant_6_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Slice_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.1/dwconv/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Slice_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Transpose_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.1/dwconv/Reshape_1", + "inputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Transpose_output_0", + "/text_encoder/convnext/convnext.1/dwconv/Constant_7_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Reshape_1_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/convnext/convnext.1/dwconv/Cast", + "inputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Reshape_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Cast_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/convnext/convnext.1/dwconv/Pad", + "inputs": [ + "/text_encoder/convnext/convnext.1/Mul_output_0", + "/text_encoder/convnext/convnext.1/dwconv/Cast_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Pad_output_0" + ], + "attrs": { + "mode": "edge" + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.1/dwconv/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Pad_output_0", + "tts.ttl.text_encoder.convnext.convnext.1.dwconv.weight", + "tts.ttl.text_encoder.convnext.convnext.1.dwconv.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 256, + "kernel_shape": [ + 5 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.1/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.1/dwconv/Conv_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.1/norm/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.1/Mul_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/norm/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/convnext/convnext.1/norm/norm/LayerNormalization", + "inputs": [ + "/text_encoder/convnext/convnext.1/norm/Transpose_output_0", + "tts.ttl.text_encoder.convnext.convnext.1.norm.norm.weight", + "tts.ttl.text_encoder.convnext.convnext.1.norm.norm.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/norm/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.1/norm/Transpose_1", + "inputs": [ + "/text_encoder/convnext/convnext.1/norm/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/norm/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.1/pwconv1/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.1/norm/Transpose_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.1.pwconv1.weight", + "tts.ttl.text_encoder.convnext.convnext.1.pwconv1.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/pwconv1/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Div", + "name": "/text_encoder/convnext/convnext.1/act/Div", + "inputs": [ + "/text_encoder/convnext/convnext.1/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.1/act/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/act/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "Erf", + "name": "/text_encoder/convnext/convnext.1/act/Erf", + "inputs": [ + "/text_encoder/convnext/convnext.1/act/Div_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/act/Erf_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.1/act/Add", + "inputs": [ + "/text_encoder/convnext/convnext.1/act/Erf_output_0", + "/text_encoder/convnext/convnext.1/act/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/act/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.1/act/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.1/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.1/act/Add_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/act/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.1/act/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.1/act/Mul_output_0", + "/text_encoder/convnext/convnext.1/act/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/act/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.1/pwconv2/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.1/act/Mul_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.1.pwconv2.weight", + "tts.ttl.text_encoder.convnext.convnext.1.pwconv2.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/pwconv2/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.1/Mul_2", + "inputs": [ + "tts.ttl.text_encoder.convnext.convnext.1.gamma", + "/text_encoder/convnext/convnext.1/pwconv2/Conv_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.1/Add", + "inputs": [ + "/text_encoder/convnext/convnext.1/Mul_output_0", + "/text_encoder/convnext/convnext.1/Mul_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.1/Mul_3", + "inputs": [ + "/text_encoder/convnext/convnext.1/Add_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.1/Mul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.2/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.1/Mul_3_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/convnext/convnext.2/dwconv/ConstantOfShape", + "inputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/dwconv/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/convnext/convnext.2/dwconv/Concat", + "inputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Constant_1_output_0", + "/text_encoder/convnext/convnext.2/dwconv/ConstantOfShape_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.2/dwconv/Reshape", + "inputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Concat_output_0", + "/text_encoder/convnext/convnext.2/dwconv/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Reshape_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/convnext/convnext.2/dwconv/Slice", + "inputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Reshape_output_0", + "/text_encoder/convnext/convnext.2/dwconv/Constant_4_output_0", + "/text_encoder/convnext/convnext.2/dwconv/Constant_5_output_0", + "/text_encoder/convnext/convnext.2/dwconv/Constant_3_output_0", + "/text_encoder/convnext/convnext.2/dwconv/Constant_6_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Slice_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.2/dwconv/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Slice_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Transpose_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.2/dwconv/Reshape_1", + "inputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Transpose_output_0", + "/text_encoder/convnext/convnext.2/dwconv/Constant_7_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Reshape_1_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/convnext/convnext.2/dwconv/Cast", + "inputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Reshape_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Cast_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/convnext/convnext.2/dwconv/Pad", + "inputs": [ + "/text_encoder/convnext/convnext.2/Mul_output_0", + "/text_encoder/convnext/convnext.2/dwconv/Cast_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Pad_output_0" + ], + "attrs": { + "mode": "edge" + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.2/dwconv/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Pad_output_0", + "tts.ttl.text_encoder.convnext.convnext.2.dwconv.weight", + "tts.ttl.text_encoder.convnext.convnext.2.dwconv.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Conv_output_0" + ], + "attrs": { + "dilations": [ + 2 + ], + "group": 256, + "kernel_shape": [ + 5 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.2/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.2/dwconv/Conv_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.2/norm/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.2/Mul_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/norm/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/convnext/convnext.2/norm/norm/LayerNormalization", + "inputs": [ + "/text_encoder/convnext/convnext.2/norm/Transpose_output_0", + "tts.ttl.text_encoder.convnext.convnext.2.norm.norm.weight", + "tts.ttl.text_encoder.convnext.convnext.2.norm.norm.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/norm/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.2/norm/Transpose_1", + "inputs": [ + "/text_encoder/convnext/convnext.2/norm/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/norm/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.2/pwconv1/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.2/norm/Transpose_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.2.pwconv1.weight", + "tts.ttl.text_encoder.convnext.convnext.2.pwconv1.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/pwconv1/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Div", + "name": "/text_encoder/convnext/convnext.2/act/Div", + "inputs": [ + "/text_encoder/convnext/convnext.2/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.2/act/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/act/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "Erf", + "name": "/text_encoder/convnext/convnext.2/act/Erf", + "inputs": [ + "/text_encoder/convnext/convnext.2/act/Div_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/act/Erf_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.2/act/Add", + "inputs": [ + "/text_encoder/convnext/convnext.2/act/Erf_output_0", + "/text_encoder/convnext/convnext.2/act/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/act/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.2/act/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.2/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.2/act/Add_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/act/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.2/act/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.2/act/Mul_output_0", + "/text_encoder/convnext/convnext.2/act/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/act/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.2/pwconv2/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.2/act/Mul_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.2.pwconv2.weight", + "tts.ttl.text_encoder.convnext.convnext.2.pwconv2.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/pwconv2/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.2/Mul_2", + "inputs": [ + "tts.ttl.text_encoder.convnext.convnext.2.gamma", + "/text_encoder/convnext/convnext.2/pwconv2/Conv_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.2/Add", + "inputs": [ + "/text_encoder/convnext/convnext.2/Mul_output_0", + "/text_encoder/convnext/convnext.2/Mul_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.2/Mul_3", + "inputs": [ + "/text_encoder/convnext/convnext.2/Add_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.2/Mul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.3/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.2/Mul_3_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/convnext/convnext.3/dwconv/ConstantOfShape", + "inputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/dwconv/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/convnext/convnext.3/dwconv/Concat", + "inputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Constant_1_output_0", + "/text_encoder/convnext/convnext.3/dwconv/ConstantOfShape_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.3/dwconv/Reshape", + "inputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Concat_output_0", + "/text_encoder/convnext/convnext.3/dwconv/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Reshape_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/convnext/convnext.3/dwconv/Slice", + "inputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Reshape_output_0", + "/text_encoder/convnext/convnext.3/dwconv/Constant_4_output_0", + "/text_encoder/convnext/convnext.3/dwconv/Constant_5_output_0", + "/text_encoder/convnext/convnext.3/dwconv/Constant_3_output_0", + "/text_encoder/convnext/convnext.3/dwconv/Constant_6_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Slice_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.3/dwconv/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Slice_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Transpose_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.3/dwconv/Reshape_1", + "inputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Transpose_output_0", + "/text_encoder/convnext/convnext.3/dwconv/Constant_7_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Reshape_1_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/convnext/convnext.3/dwconv/Cast", + "inputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Reshape_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Cast_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/convnext/convnext.3/dwconv/Pad", + "inputs": [ + "/text_encoder/convnext/convnext.3/Mul_output_0", + "/text_encoder/convnext/convnext.3/dwconv/Cast_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Pad_output_0" + ], + "attrs": { + "mode": "edge" + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.3/dwconv/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Pad_output_0", + "tts.ttl.text_encoder.convnext.convnext.3.dwconv.weight", + "tts.ttl.text_encoder.convnext.convnext.3.dwconv.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Conv_output_0" + ], + "attrs": { + "dilations": [ + 2 + ], + "group": 256, + "kernel_shape": [ + 5 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.3/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.3/dwconv/Conv_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.3/norm/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.3/Mul_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/norm/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/convnext/convnext.3/norm/norm/LayerNormalization", + "inputs": [ + "/text_encoder/convnext/convnext.3/norm/Transpose_output_0", + "tts.ttl.text_encoder.convnext.convnext.3.norm.norm.weight", + "tts.ttl.text_encoder.convnext.convnext.3.norm.norm.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/norm/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.3/norm/Transpose_1", + "inputs": [ + "/text_encoder/convnext/convnext.3/norm/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/norm/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.3/pwconv1/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.3/norm/Transpose_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.3.pwconv1.weight", + "tts.ttl.text_encoder.convnext.convnext.3.pwconv1.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/pwconv1/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Div", + "name": "/text_encoder/convnext/convnext.3/act/Div", + "inputs": [ + "/text_encoder/convnext/convnext.3/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.3/act/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/act/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "Erf", + "name": "/text_encoder/convnext/convnext.3/act/Erf", + "inputs": [ + "/text_encoder/convnext/convnext.3/act/Div_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/act/Erf_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.3/act/Add", + "inputs": [ + "/text_encoder/convnext/convnext.3/act/Erf_output_0", + "/text_encoder/convnext/convnext.3/act/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/act/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.3/act/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.3/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.3/act/Add_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/act/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.3/act/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.3/act/Mul_output_0", + "/text_encoder/convnext/convnext.3/act/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/act/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.3/pwconv2/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.3/act/Mul_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.3.pwconv2.weight", + "tts.ttl.text_encoder.convnext.convnext.3.pwconv2.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/pwconv2/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.3/Mul_2", + "inputs": [ + "tts.ttl.text_encoder.convnext.convnext.3.gamma", + "/text_encoder/convnext/convnext.3/pwconv2/Conv_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.3/Add", + "inputs": [ + "/text_encoder/convnext/convnext.3/Mul_output_0", + "/text_encoder/convnext/convnext.3/Mul_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.3/Mul_3", + "inputs": [ + "/text_encoder/convnext/convnext.3/Add_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.3/Mul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.4/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.3/Mul_3_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/convnext/convnext.4/dwconv/ConstantOfShape", + "inputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/dwconv/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/convnext/convnext.4/dwconv/Concat", + "inputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Constant_1_output_0", + "/text_encoder/convnext/convnext.4/dwconv/ConstantOfShape_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.4/dwconv/Reshape", + "inputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Concat_output_0", + "/text_encoder/convnext/convnext.4/dwconv/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Reshape_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/convnext/convnext.4/dwconv/Slice", + "inputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Reshape_output_0", + "/text_encoder/convnext/convnext.4/dwconv/Constant_4_output_0", + "/text_encoder/convnext/convnext.4/dwconv/Constant_5_output_0", + "/text_encoder/convnext/convnext.4/dwconv/Constant_3_output_0", + "/text_encoder/convnext/convnext.4/dwconv/Constant_6_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Slice_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.4/dwconv/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Slice_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Transpose_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.4/dwconv/Reshape_1", + "inputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Transpose_output_0", + "/text_encoder/convnext/convnext.4/dwconv/Constant_7_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Reshape_1_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/convnext/convnext.4/dwconv/Cast", + "inputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Reshape_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Cast_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/convnext/convnext.4/dwconv/Pad", + "inputs": [ + "/text_encoder/convnext/convnext.4/Mul_output_0", + "/text_encoder/convnext/convnext.4/dwconv/Cast_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Pad_output_0" + ], + "attrs": { + "mode": "edge" + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.4/dwconv/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Pad_output_0", + "tts.ttl.text_encoder.convnext.convnext.4.dwconv.weight", + "tts.ttl.text_encoder.convnext.convnext.4.dwconv.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Conv_output_0" + ], + "attrs": { + "dilations": [ + 4 + ], + "group": 256, + "kernel_shape": [ + 5 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.4/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.4/dwconv/Conv_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.4/norm/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.4/Mul_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/norm/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/convnext/convnext.4/norm/norm/LayerNormalization", + "inputs": [ + "/text_encoder/convnext/convnext.4/norm/Transpose_output_0", + "tts.ttl.text_encoder.convnext.convnext.4.norm.norm.weight", + "tts.ttl.text_encoder.convnext.convnext.4.norm.norm.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/norm/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.4/norm/Transpose_1", + "inputs": [ + "/text_encoder/convnext/convnext.4/norm/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/norm/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.4/pwconv1/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.4/norm/Transpose_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.4.pwconv1.weight", + "tts.ttl.text_encoder.convnext.convnext.4.pwconv1.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/pwconv1/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Div", + "name": "/text_encoder/convnext/convnext.4/act/Div", + "inputs": [ + "/text_encoder/convnext/convnext.4/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.4/act/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/act/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "Erf", + "name": "/text_encoder/convnext/convnext.4/act/Erf", + "inputs": [ + "/text_encoder/convnext/convnext.4/act/Div_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/act/Erf_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.4/act/Add", + "inputs": [ + "/text_encoder/convnext/convnext.4/act/Erf_output_0", + "/text_encoder/convnext/convnext.4/act/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/act/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.4/act/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.4/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.4/act/Add_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/act/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.4/act/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.4/act/Mul_output_0", + "/text_encoder/convnext/convnext.4/act/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/act/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.4/pwconv2/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.4/act/Mul_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.4.pwconv2.weight", + "tts.ttl.text_encoder.convnext.convnext.4.pwconv2.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/pwconv2/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.4/Mul_2", + "inputs": [ + "tts.ttl.text_encoder.convnext.convnext.4.gamma", + "/text_encoder/convnext/convnext.4/pwconv2/Conv_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.4/Add", + "inputs": [ + "/text_encoder/convnext/convnext.4/Mul_output_0", + "/text_encoder/convnext/convnext.4/Mul_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.4/Mul_3", + "inputs": [ + "/text_encoder/convnext/convnext.4/Add_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.4/Mul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.5/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.4/Mul_3_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/convnext/convnext.5/dwconv/ConstantOfShape", + "inputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/dwconv/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/convnext/convnext.5/dwconv/Concat", + "inputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Constant_1_output_0", + "/text_encoder/convnext/convnext.5/dwconv/ConstantOfShape_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.5/dwconv/Reshape", + "inputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Concat_output_0", + "/text_encoder/convnext/convnext.5/dwconv/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Reshape_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/convnext/convnext.5/dwconv/Slice", + "inputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Reshape_output_0", + "/text_encoder/convnext/convnext.5/dwconv/Constant_4_output_0", + "/text_encoder/convnext/convnext.5/dwconv/Constant_5_output_0", + "/text_encoder/convnext/convnext.5/dwconv/Constant_3_output_0", + "/text_encoder/convnext/convnext.5/dwconv/Constant_6_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Slice_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.5/dwconv/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Slice_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Transpose_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/convnext/convnext.5/dwconv/Reshape_1", + "inputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Transpose_output_0", + "/text_encoder/convnext/convnext.5/dwconv/Constant_7_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Reshape_1_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/convnext/convnext.5/dwconv/Cast", + "inputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Reshape_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Cast_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/convnext/convnext.5/dwconv/Pad", + "inputs": [ + "/text_encoder/convnext/convnext.5/Mul_output_0", + "/text_encoder/convnext/convnext.5/dwconv/Cast_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Pad_output_0" + ], + "attrs": { + "mode": "edge" + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.5/dwconv/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Pad_output_0", + "tts.ttl.text_encoder.convnext.convnext.5.dwconv.weight", + "tts.ttl.text_encoder.convnext.convnext.5.dwconv.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Conv_output_0" + ], + "attrs": { + "dilations": [ + 4 + ], + "group": 256, + "kernel_shape": [ + 5 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.5/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.5/dwconv/Conv_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.5/norm/Transpose", + "inputs": [ + "/text_encoder/convnext/convnext.5/Mul_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/norm/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/convnext/convnext.5/norm/norm/LayerNormalization", + "inputs": [ + "/text_encoder/convnext/convnext.5/norm/Transpose_output_0", + "tts.ttl.text_encoder.convnext.convnext.5.norm.norm.weight", + "tts.ttl.text_encoder.convnext.convnext.5.norm.norm.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/norm/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/convnext/convnext.5/norm/Transpose_1", + "inputs": [ + "/text_encoder/convnext/convnext.5/norm/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/norm/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.5/pwconv1/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.5/norm/Transpose_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.5.pwconv1.weight", + "tts.ttl.text_encoder.convnext.convnext.5.pwconv1.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/pwconv1/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Div", + "name": "/text_encoder/convnext/convnext.5/act/Div", + "inputs": [ + "/text_encoder/convnext/convnext.5/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.5/act/Constant_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/act/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "Erf", + "name": "/text_encoder/convnext/convnext.5/act/Erf", + "inputs": [ + "/text_encoder/convnext/convnext.5/act/Div_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/act/Erf_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.5/act/Add", + "inputs": [ + "/text_encoder/convnext/convnext.5/act/Erf_output_0", + "/text_encoder/convnext/convnext.5/act/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/act/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.5/act/Mul", + "inputs": [ + "/text_encoder/convnext/convnext.5/pwconv1/Conv_output_0", + "/text_encoder/convnext/convnext.5/act/Add_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/act/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.5/act/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.5/act/Mul_output_0", + "/text_encoder/convnext/convnext.5/act/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/act/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/convnext/convnext.5/pwconv2/Conv", + "inputs": [ + "/text_encoder/convnext/convnext.5/act/Mul_1_output_0", + "tts.ttl.text_encoder.convnext.convnext.5.pwconv2.weight", + "tts.ttl.text_encoder.convnext.convnext.5.pwconv2.bias" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/pwconv2/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.5/Mul_2", + "inputs": [ + "tts.ttl.text_encoder.convnext.convnext.5.gamma", + "/text_encoder/convnext/convnext.5/pwconv2/Conv_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/convnext/convnext.5/Add", + "inputs": [ + "/text_encoder/convnext/convnext.5/Mul_output_0", + "/text_encoder/convnext/convnext.5/Mul_2_output_0" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/convnext/convnext.5/Mul_3", + "inputs": [ + "/text_encoder/convnext/convnext.5/Add_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/convnext/convnext.5/Mul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/Unsqueeze", + "inputs": [ + "text_mask", + "/text_encoder/attn_encoder/Constant_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Unsqueeze_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/Unsqueeze_1", + "inputs": [ + "text_mask", + "/text_encoder/attn_encoder/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Unsqueeze_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/Mul", + "inputs": [ + "/text_encoder/attn_encoder/Unsqueeze_output_0", + "/text_encoder/attn_encoder/Unsqueeze_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/Mul_1", + "inputs": [ + "/text_encoder/convnext/convnext.5/Mul_3_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.0/conv_q/Conv", + "inputs": [ + "/text_encoder/attn_encoder/Mul_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_q.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_q.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_q/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.0/conv_k/Conv", + "inputs": [ + "/text_encoder/attn_encoder/Mul_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_k.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_k.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_k/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.0/conv_v/Conv", + "inputs": [ + "/text_encoder/attn_encoder/Mul_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_v.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_v.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_v/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_1_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_2_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_2_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_q/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_3_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_3_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_output_0", + "onnx::Unsqueeze_1234" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_3_output_0", + "onnx::Unsqueeze_1240" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_4_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_5_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_q/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Concat_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.0/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_output_0", + "onnx::Unsqueeze_1246" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_2_output_0", + "onnx::Unsqueeze_1252" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_2_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_6_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_7_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_1_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_output_0", + "onnx::Unsqueeze_1255" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_2_output_0", + "onnx::Unsqueeze_1261" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_4_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_8_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_9_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_2_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_k/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Concat_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_1_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_v/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Concat_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_2_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.0/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Div", + "name": "/text_encoder/attn_encoder/attn_layers.0/Div", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.0/MatMul", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Div_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Reshape_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_2_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_11_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_output_0" + ], + "attrs": {} + }, + { + "op_type": "Clip", + "name": "/text_encoder/attn_encoder/attn_layers.0/Clip", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_12_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_13_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Gather_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Clip", + "name": "/text_encoder/attn_encoder/attn_layers.0/Clip_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_14_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.0/Mul", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_2_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.0/Add", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Mul_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Add_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_16_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_output_0", + "onnx::Unsqueeze_1291" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_output_0", + "onnx::Unsqueeze_1293" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_17_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_18_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_6_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_7_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_19_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_20_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_3_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_output_0", + "onnx::Unsqueeze_1304" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_output_0", + "onnx::Unsqueeze_1306" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_21_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_22_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_8_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_9_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_23_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_24_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_4_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_output_0", + "onnx::Unsqueeze_1317" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_output_0", + "onnx::Unsqueeze_1319" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_11_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_25_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_26_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_10_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_11_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_27_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_28_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_5_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_output_0", + "onnx::Unsqueeze_1330" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_12_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_output_0", + "onnx::Unsqueeze_1332" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_13_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_29_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_30_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_12_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_13_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_31_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_32_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_6_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_4_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_33_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_4_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_34_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Gather_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_output_0", + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_7_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_7_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_35_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_3_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_3_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_37_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_38_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_36_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_39_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.0/Transpose_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_2_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_2_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_40_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_4_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_1_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.0/Pad", + "inputs": [ + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.emb_rel_k", + "/text_encoder/attn_encoder/attn_layers.0/Cast_1_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_42_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_14_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_2_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_43_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_15_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_14_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_15_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_41_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_44_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_45_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_16_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.0/Transpose_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_16_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_3_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.0/MatMul_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Div_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Transpose_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/MatMul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_5_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_46_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_5_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_6_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_47_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_6_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_7_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_48_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_7_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_49_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_1_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_50_output_0", + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_8_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_8_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_51_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_5_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_5_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_53_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_54_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_52_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_55_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.0/Transpose_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_4_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_4_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_56_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_6_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_2_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.0/Pad_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/MatMul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Cast_2_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_1_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.0/Mul_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_57_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.0/Mul_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Mul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Gather_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_5_output_0", + "onnx::Unsqueeze_1410" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_17_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_6_output_0", + "onnx::Unsqueeze_1412" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_18_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Mul_2_output_0", + "onnx::Unsqueeze_1414" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_19_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_17_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_18_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_19_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_9_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Concat_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_7_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_58_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_20", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_4_output_0", + "onnx::Unsqueeze_1422" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_20_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_59_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_20_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_60_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_61_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_62_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_63_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_10_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_21", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_4_output_0", + "onnx::Unsqueeze_1435" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_21_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_64_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_21_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_65_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_66_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_67_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_68_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_11_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_8_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_69_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_8_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_70_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Gather_8_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_11_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_3_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_2_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_3_output_0", + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_12_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_12_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_71_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_8_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_8_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_73_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_74_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_72_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_75_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.0/Transpose_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_5_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_5_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_76_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_9_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_4_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.0/Pad_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_7_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Cast_4_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_2_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.0/Add_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_77_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Add_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Mul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_78_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_22", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_5_output_0", + "onnx::Unsqueeze_1472" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_22_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_23", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_6_output_0", + "onnx::Unsqueeze_1474" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_23_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_24", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Add_1_output_0", + "onnx::Unsqueeze_1476" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_24_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_25", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_6_output_0", + "onnx::Unsqueeze_1478" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_25_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_22_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_23_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_24_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_25_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_13_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_2_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Concat_13_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_10_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_26", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_81_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_26_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_10_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_80_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_26_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_79_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_82_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_27", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_4_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_84_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_27_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_4_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_27_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_85_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_83_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_86_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.0/Add_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/MatMul_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Slice_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Add_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Equal", + "name": "/text_encoder/attn_encoder/attn_layers.0/Equal", + "inputs": [ + "/text_encoder/attn_encoder/Mul_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_87_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Equal_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Equal_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_5_output_0" + ], + "attrs": { + "to": 9 + } + }, + { + "op_type": "Where", + "name": "/text_encoder/attn_encoder/attn_layers.0/Where", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_5_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_88_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Add_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Where_output_0" + ], + "attrs": {} + }, + { + "op_type": "Softmax", + "name": "/text_encoder/attn_encoder/attn_layers.0/Softmax", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Where_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Softmax_output_0" + ], + "attrs": { + "axis": -1 + } + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.0/MatMul_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Softmax_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Transpose_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/MatMul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_9_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_89_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_9_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_10_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_90_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_10_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_11_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_11_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_91_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_11_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_92_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_28", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_7_output_0", + "onnx::Unsqueeze_1521" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_28_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_93_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_28_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_94_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_95_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_96_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_97_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_98_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_99_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_14_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_29", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_7_output_0", + "onnx::Unsqueeze_1538" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_29_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_100_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_29_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_101_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_102_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_103_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_104_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_105_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_106_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_15_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_14_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_12_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_12_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_107_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_12_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_108_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Gather_12_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_6_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_8_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_3_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_6_output_0", + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_16_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_16_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_109_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_11_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_11_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_111_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_112_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_110_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_113_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.0/Transpose_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_6_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_6_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_114_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_12_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_12_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_7_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.0/Pad_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Softmax_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Cast_7_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_3_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Pow", + "name": "/text_encoder/attn_encoder/attn_layers.0/Pow", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_115_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pow_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.0/Mul_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Sub_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Mul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.0/Add_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pow_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Mul_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Add_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_30", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_9_output_0", + "onnx::Unsqueeze_1579" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_30_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_31", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_10_output_0", + "onnx::Unsqueeze_1581" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_31_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_32", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Add_3_output_0", + "onnx::Unsqueeze_1583" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_32_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_30_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_31_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_32_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_17_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_3_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Concat_17_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_13_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_33", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_11_output_0", + "onnx::Unsqueeze_1587" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_33_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_33_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_116_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_117_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_118_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_119_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_120_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_18_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_34", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_11_output_0", + "onnx::Unsqueeze_1600" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_34_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_34_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_121_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_122_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_123_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_124_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_125_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_19_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_18_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_13_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_13_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_126_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_13_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_127_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Gather_13_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_19_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_8_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_4_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_20", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_8_output_0", + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_20_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_20_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_128_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_14_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_14_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_130_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_131_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_129_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_132_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.0/Transpose_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_7_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_7_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_133_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_15_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_9_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.0/Pad_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_13_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Cast_9_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_4_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.0/Mul_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_134_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Mul_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_35", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_9_output_0", + "onnx::Unsqueeze_1637" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_35_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_36", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_10_output_0", + "onnx::Unsqueeze_1639" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_36_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_37", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_11_output_0", + "onnx::Unsqueeze_1641" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_37_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_38", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Mul_4_output_0", + "onnx::Unsqueeze_1643" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_38_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_21", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_35_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_36_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_37_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_38_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_21_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_4_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Concat_21_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_16_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_16_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_136_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_137_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_135_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_138_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Shape_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_14_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.0/Gather_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Shape_14_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_139_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_14_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.0/Sub_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Constant_140_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Gather_14_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_10_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_5_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_22", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_10_output_0", + "/text_encoder/attn_encoder/attn_layers.0/ConstantOfShape_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_22_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_22_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_141_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_17_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_17_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_143_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_144_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_142_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_145_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.0/Transpose_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_8_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_8_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_146_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_18_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.0/Cast_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_18_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Cast_11_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.0/Pad_5", + "inputs": [ + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.emb_rel_v", + "/text_encoder/attn_encoder/attn_layers.0/Cast_11_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_5_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_39", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_148_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_39_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_40", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Sub_2_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_149_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_40_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.0/Slice_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Pad_5_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_39_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_40_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_147_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_150_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_41", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_10_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Constant_151_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_41_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.0/MatMul_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Slice_8_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_41_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/MatMul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.0/Add_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/MatMul_2_output_0", + "/text_encoder/attn_encoder/attn_layers.0/MatMul_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Add_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.0/Transpose_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Add_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_9_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_42", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_output_0", + "onnx::Unsqueeze_1692" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_42_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_43", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_1_output_0", + "onnx::Unsqueeze_1694" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_43_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_44", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Gather_3_output_0", + "onnx::Unsqueeze_1696" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_44_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.0/Concat_23", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_42_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_43_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Unsqueeze_44_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Concat_23_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.0/Reshape_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Transpose_9_output_0", + "/text_encoder/attn_encoder/attn_layers.0/Concat_23_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_19_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.0/conv_o/Conv", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Reshape_19_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_o.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.0.conv_o.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.0/conv_o/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/Add", + "inputs": [ + "/text_encoder/attn_encoder/Mul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.0/conv_o/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_1.0/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/Add_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.0/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/attn_encoder/norm_layers_1.0/norm/LayerNormalization", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.0/Transpose_output_0", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.0.norm.weight", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.0.norm.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.0/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_1.0/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.0/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.0/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.0/Mul", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.0/Transpose_1_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/ffn_layers.0/conv_1/Conv", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/Mul_output_0", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.0.conv_1.weight", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.0.conv_1.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/conv_1/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Relu", + "name": "/text_encoder/attn_encoder/ffn_layers.0/Relu", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/conv_1/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/Relu_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.0/Mul_1", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/Relu_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/ffn_layers.0/conv_2/Conv", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/Mul_1_output_0", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.0.conv_2.weight", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.0.conv_2.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/conv_2/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.0/Mul_2", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/conv_2/Conv_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.0/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/Add_1", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.0/Transpose_1_output_0", + "/text_encoder/attn_encoder/ffn_layers.0/Mul_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Add_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_2.0/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/Add_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.0/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/attn_encoder/norm_layers_2.0/norm/LayerNormalization", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.0/Transpose_output_0", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.0.norm.weight", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.0.norm.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.0/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_2.0/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.0/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.0/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.1/conv_q/Conv", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.0/Transpose_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_q.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_q.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_q/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.1/conv_k/Conv", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.0/Transpose_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_k.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_k.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_k/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.1/conv_v/Conv", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.0/Transpose_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_v.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_v.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_v/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_1_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_2_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_2_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_q/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_3_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_3_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_output_0", + "onnx::Unsqueeze_1730" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_3_output_0", + "onnx::Unsqueeze_1736" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_4_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_5_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_q/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Concat_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.1/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_output_0", + "onnx::Unsqueeze_1741" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_2_output_0", + "onnx::Unsqueeze_1747" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_2_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_6_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_7_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_1_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_output_0", + "onnx::Unsqueeze_1750" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_2_output_0", + "onnx::Unsqueeze_1756" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_4_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_8_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_9_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_2_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_k/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Concat_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_1_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_v/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Concat_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_2_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.1/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Div", + "name": "/text_encoder/attn_encoder/attn_layers.1/Div", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.1/MatMul", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Div_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Reshape_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_2_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_11_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_output_0" + ], + "attrs": {} + }, + { + "op_type": "Clip", + "name": "/text_encoder/attn_encoder/attn_layers.1/Clip", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_12_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_13_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Gather_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Clip", + "name": "/text_encoder/attn_encoder/attn_layers.1/Clip_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_14_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.1/Mul", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_2_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.1/Add", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Mul_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Add_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_16_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_output_0", + "onnx::Unsqueeze_1786" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_output_0", + "onnx::Unsqueeze_1788" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_17_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_18_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_6_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_7_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_19_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_20_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_3_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_output_0", + "onnx::Unsqueeze_1799" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_output_0", + "onnx::Unsqueeze_1801" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_21_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_22_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_8_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_9_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_23_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_24_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_4_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_output_0", + "onnx::Unsqueeze_1812" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_output_0", + "onnx::Unsqueeze_1814" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_11_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_25_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_26_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_10_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_11_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_27_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_28_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_5_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_output_0", + "onnx::Unsqueeze_1825" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_12_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_output_0", + "onnx::Unsqueeze_1827" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_13_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_29_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_30_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_12_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_13_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_31_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_32_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_6_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_4_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_33_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_4_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_34_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Gather_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_output_0", + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_7_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_7_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_35_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_3_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_3_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_37_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_38_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_36_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_39_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.1/Transpose_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_2_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_2_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_40_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_4_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_1_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.1/Pad", + "inputs": [ + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.emb_rel_k", + "/text_encoder/attn_encoder/attn_layers.1/Cast_1_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_42_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_14_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_2_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_43_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_15_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_14_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_15_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_41_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_44_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_45_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_16_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.1/Transpose_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_16_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_3_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.1/MatMul_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Div_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Transpose_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/MatMul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_5_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_46_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_5_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_6_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_47_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_6_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_7_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_48_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_7_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_49_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_1_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_50_output_0", + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_8_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_8_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_51_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_5_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_5_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_53_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_54_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_52_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_55_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.1/Transpose_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_4_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_4_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_56_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_6_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_2_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.1/Pad_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/MatMul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Cast_2_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_1_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.1/Mul_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_57_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.1/Mul_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Mul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Gather_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_5_output_0", + "onnx::Unsqueeze_1903" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_17_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_6_output_0", + "onnx::Unsqueeze_1905" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_18_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Mul_2_output_0", + "onnx::Unsqueeze_1907" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_19_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_17_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_18_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_19_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_9_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Concat_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_7_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_58_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_20", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_4_output_0", + "onnx::Unsqueeze_1915" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_20_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_59_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_20_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_60_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_61_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_62_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_63_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_10_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_21", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_4_output_0", + "onnx::Unsqueeze_1928" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_21_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_64_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_21_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_65_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_66_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_67_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_68_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_11_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_8_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_69_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_8_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_70_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Gather_8_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_11_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_3_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_2_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_3_output_0", + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_12_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_12_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_71_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_8_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_8_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_73_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_74_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_72_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_75_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.1/Transpose_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_5_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_5_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_76_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_9_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_4_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.1/Pad_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_7_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Cast_4_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_2_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.1/Add_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_77_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Add_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Mul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_78_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_22", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_5_output_0", + "onnx::Unsqueeze_1965" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_22_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_23", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_6_output_0", + "onnx::Unsqueeze_1967" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_23_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_24", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Add_1_output_0", + "onnx::Unsqueeze_1969" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_24_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_25", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_6_output_0", + "onnx::Unsqueeze_1971" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_25_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_22_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_23_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_24_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_25_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_13_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_2_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Concat_13_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_10_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_26", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_81_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_26_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_10_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_80_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_26_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_79_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_82_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_27", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_4_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_84_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_27_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_4_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_27_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_85_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_83_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_86_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.1/Add_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/MatMul_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Slice_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Add_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Equal_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_5_output_0" + ], + "attrs": { + "to": 9 + } + }, + { + "op_type": "Where", + "name": "/text_encoder/attn_encoder/attn_layers.1/Where", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_5_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_87_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Add_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Where_output_0" + ], + "attrs": {} + }, + { + "op_type": "Softmax", + "name": "/text_encoder/attn_encoder/attn_layers.1/Softmax", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Where_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Softmax_output_0" + ], + "attrs": { + "axis": -1 + } + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.1/MatMul_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Softmax_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Transpose_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/MatMul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_9_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_88_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_9_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_10_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_89_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_10_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_11_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_11_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_90_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_11_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_91_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_28", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_7_output_0", + "onnx::Unsqueeze_2012" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_28_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_92_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_28_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_93_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_94_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_95_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_96_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_97_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_98_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_14_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_29", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_7_output_0", + "onnx::Unsqueeze_2029" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_29_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_99_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_29_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_100_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_101_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_102_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_103_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_104_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_105_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_15_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_14_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_12_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_12_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_106_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_12_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_107_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Gather_12_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_6_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_8_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_3_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_6_output_0", + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_16_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_16_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_108_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_11_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_11_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_110_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_111_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_109_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_112_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.1/Transpose_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_6_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_6_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_113_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_12_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_12_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_7_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.1/Pad_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Softmax_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Cast_7_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_3_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Pow", + "name": "/text_encoder/attn_encoder/attn_layers.1/Pow", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_114_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pow_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.1/Mul_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Sub_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Mul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.1/Add_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pow_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Mul_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Add_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_30", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_9_output_0", + "onnx::Unsqueeze_2070" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_30_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_31", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_10_output_0", + "onnx::Unsqueeze_2072" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_31_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_32", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Add_3_output_0", + "onnx::Unsqueeze_2074" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_32_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_30_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_31_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_32_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_17_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_3_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Concat_17_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_13_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_33", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_11_output_0", + "onnx::Unsqueeze_2078" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_33_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_33_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_115_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_116_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_117_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_118_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_119_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_18_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_34", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_11_output_0", + "onnx::Unsqueeze_2091" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_34_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_34_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_120_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_121_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_122_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_123_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_124_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_19_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_18_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_13_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_13_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_125_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_13_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_126_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Gather_13_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_19_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_8_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_4_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_20", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_8_output_0", + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_20_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_20_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_127_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_14_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_14_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_129_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_130_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_128_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_131_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.1/Transpose_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_7_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_7_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_132_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_15_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_9_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.1/Pad_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_13_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Cast_9_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_4_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.1/Mul_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_133_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Mul_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_35", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_9_output_0", + "onnx::Unsqueeze_2128" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_35_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_36", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_10_output_0", + "onnx::Unsqueeze_2130" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_36_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_37", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_11_output_0", + "onnx::Unsqueeze_2132" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_37_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_38", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Mul_4_output_0", + "onnx::Unsqueeze_2134" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_38_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_21", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_35_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_36_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_37_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_38_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_21_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_4_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Concat_21_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_16_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_16_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_135_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_136_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_134_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_137_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Shape_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_14_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.1/Gather_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Shape_14_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_138_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_14_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.1/Sub_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Constant_139_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Gather_14_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_10_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_5_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_22", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_10_output_0", + "/text_encoder/attn_encoder/attn_layers.1/ConstantOfShape_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_22_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_22_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_140_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_17_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_17_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_142_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_143_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_141_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_144_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.1/Transpose_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_8_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_8_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_145_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_18_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.1/Cast_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_18_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Cast_11_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.1/Pad_5", + "inputs": [ + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.emb_rel_v", + "/text_encoder/attn_encoder/attn_layers.1/Cast_11_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_5_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_39", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_147_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_39_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_40", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Sub_2_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_148_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_40_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.1/Slice_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Pad_5_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_39_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_40_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_146_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_149_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_41", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_10_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Constant_150_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_41_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.1/MatMul_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Slice_8_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_41_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/MatMul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.1/Add_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/MatMul_2_output_0", + "/text_encoder/attn_encoder/attn_layers.1/MatMul_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Add_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.1/Transpose_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Add_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_9_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_42", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_output_0", + "onnx::Unsqueeze_2183" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_42_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_43", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_1_output_0", + "onnx::Unsqueeze_2185" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_43_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_44", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Gather_3_output_0", + "onnx::Unsqueeze_2187" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_44_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.1/Concat_23", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_42_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_43_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Unsqueeze_44_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Concat_23_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.1/Reshape_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Transpose_9_output_0", + "/text_encoder/attn_encoder/attn_layers.1/Concat_23_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_19_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.1/conv_o/Conv", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.1/Reshape_19_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_o.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.1.conv_o.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.1/conv_o/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/Add_2", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.0/Transpose_1_output_0", + "/text_encoder/attn_encoder/attn_layers.1/conv_o/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Add_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_1.1/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/Add_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.1/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/attn_encoder/norm_layers_1.1/norm/LayerNormalization", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.1/Transpose_output_0", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.1.norm.weight", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.1.norm.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.1/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_1.1/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.1/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.1/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.1/Mul", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.1/Transpose_1_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/ffn_layers.1/conv_1/Conv", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/Mul_output_0", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.1.conv_1.weight", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.1.conv_1.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/conv_1/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Relu", + "name": "/text_encoder/attn_encoder/ffn_layers.1/Relu", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/conv_1/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/Relu_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.1/Mul_1", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/Relu_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/ffn_layers.1/conv_2/Conv", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/Mul_1_output_0", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.1.conv_2.weight", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.1.conv_2.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/conv_2/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.1/Mul_2", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/conv_2/Conv_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.1/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/Add_3", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.1/Transpose_1_output_0", + "/text_encoder/attn_encoder/ffn_layers.1/Mul_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Add_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_2.1/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/Add_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.1/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/attn_encoder/norm_layers_2.1/norm/LayerNormalization", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.1/Transpose_output_0", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.1.norm.weight", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.1.norm.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.1/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_2.1/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.1/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.1/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.2/conv_q/Conv", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.1/Transpose_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_q.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_q.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_q/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.2/conv_k/Conv", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.1/Transpose_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_k.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_k.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_k/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.2/conv_v/Conv", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.1/Transpose_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_v.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_v.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_v/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_1_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_2_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_2_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_q/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_3_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_3_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_output_0", + "onnx::Unsqueeze_2221" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_3_output_0", + "onnx::Unsqueeze_2227" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_4_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_5_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_q/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Concat_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.2/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_output_0", + "onnx::Unsqueeze_2232" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_2_output_0", + "onnx::Unsqueeze_2238" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_2_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_6_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_7_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_1_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_output_0", + "onnx::Unsqueeze_2241" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_2_output_0", + "onnx::Unsqueeze_2247" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_4_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_8_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_9_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_2_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_k/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Concat_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_1_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_v/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Concat_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_2_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.2/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Div", + "name": "/text_encoder/attn_encoder/attn_layers.2/Div", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.2/MatMul", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Div_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Reshape_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_2_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_11_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_output_0" + ], + "attrs": {} + }, + { + "op_type": "Clip", + "name": "/text_encoder/attn_encoder/attn_layers.2/Clip", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_12_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_13_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Gather_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Clip", + "name": "/text_encoder/attn_encoder/attn_layers.2/Clip_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_14_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.2/Mul", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_2_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.2/Add", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Mul_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Add_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_16_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_output_0", + "onnx::Unsqueeze_2277" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_output_0", + "onnx::Unsqueeze_2279" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_17_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_18_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_6_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_7_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_19_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_20_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_3_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_output_0", + "onnx::Unsqueeze_2290" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_output_0", + "onnx::Unsqueeze_2292" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_21_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_22_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_8_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_9_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_23_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_24_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_4_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_output_0", + "onnx::Unsqueeze_2303" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_output_0", + "onnx::Unsqueeze_2305" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_11_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_25_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_26_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_10_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_11_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_27_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_28_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_5_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_output_0", + "onnx::Unsqueeze_2316" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_12_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_output_0", + "onnx::Unsqueeze_2318" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_13_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_29_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_30_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_12_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_13_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_31_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_32_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_6_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_4_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_33_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_4_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_34_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Gather_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_output_0", + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_7_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_7_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_35_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_3_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_3_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_37_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_38_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_36_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_39_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.2/Transpose_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_2_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_2_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_40_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_4_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_1_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.2/Pad", + "inputs": [ + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.emb_rel_k", + "/text_encoder/attn_encoder/attn_layers.2/Cast_1_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_42_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_14_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_2_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_43_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_15_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_14_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_15_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_41_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_44_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_45_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_16_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.2/Transpose_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_16_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_3_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.2/MatMul_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Div_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Transpose_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/MatMul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_5_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_46_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_5_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_6_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_47_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_6_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_7_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_48_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_7_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_49_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_1_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_50_output_0", + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_8_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_8_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_51_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_5_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_5_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_53_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_54_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_52_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_55_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.2/Transpose_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_4_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_4_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_56_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_6_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_2_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.2/Pad_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/MatMul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Cast_2_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_1_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.2/Mul_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_57_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.2/Mul_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Mul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Gather_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_5_output_0", + "onnx::Unsqueeze_2394" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_17_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_6_output_0", + "onnx::Unsqueeze_2396" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_18_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Mul_2_output_0", + "onnx::Unsqueeze_2398" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_19_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_17_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_18_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_19_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_9_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Concat_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_7_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_58_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_20", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_4_output_0", + "onnx::Unsqueeze_2406" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_20_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_59_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_20_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_60_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_61_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_62_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_63_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_10_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_21", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_4_output_0", + "onnx::Unsqueeze_2419" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_21_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_64_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_21_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_65_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_66_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_67_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_68_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_11_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_8_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_69_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_8_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_70_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Gather_8_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_11_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_3_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_2_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_3_output_0", + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_12_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_12_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_71_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_8_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_8_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_73_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_74_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_72_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_75_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.2/Transpose_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_5_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_5_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_76_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_9_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_4_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.2/Pad_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_7_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Cast_4_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_2_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.2/Add_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_77_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Add_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Mul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_78_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_22", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_5_output_0", + "onnx::Unsqueeze_2456" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_22_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_23", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_6_output_0", + "onnx::Unsqueeze_2458" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_23_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_24", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Add_1_output_0", + "onnx::Unsqueeze_2460" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_24_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_25", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_6_output_0", + "onnx::Unsqueeze_2462" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_25_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_22_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_23_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_24_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_25_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_13_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_2_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Concat_13_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_10_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_26", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_81_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_26_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_10_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_80_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_26_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_79_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_82_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_27", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_4_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_84_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_27_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_4_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_27_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_85_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_83_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_86_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.2/Add_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/MatMul_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Slice_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Add_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Equal_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_5_output_0" + ], + "attrs": { + "to": 9 + } + }, + { + "op_type": "Where", + "name": "/text_encoder/attn_encoder/attn_layers.2/Where", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_5_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_87_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Add_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Where_output_0" + ], + "attrs": {} + }, + { + "op_type": "Softmax", + "name": "/text_encoder/attn_encoder/attn_layers.2/Softmax", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Where_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Softmax_output_0" + ], + "attrs": { + "axis": -1 + } + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.2/MatMul_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Softmax_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Transpose_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/MatMul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_9_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_88_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_9_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_10_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_89_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_10_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_11_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_11_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_90_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_11_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_91_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_28", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_7_output_0", + "onnx::Unsqueeze_2503" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_28_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_92_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_28_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_93_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_94_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_95_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_96_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_97_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_98_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_14_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_29", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_7_output_0", + "onnx::Unsqueeze_2520" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_29_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_99_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_29_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_100_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_101_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_102_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_103_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_104_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_105_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_15_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_14_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_12_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_12_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_106_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_12_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_107_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Gather_12_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_6_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_8_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_3_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_6_output_0", + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_16_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_16_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_108_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_11_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_11_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_110_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_111_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_109_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_112_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.2/Transpose_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_6_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_6_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_113_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_12_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_12_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_7_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.2/Pad_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Softmax_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Cast_7_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_3_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Pow", + "name": "/text_encoder/attn_encoder/attn_layers.2/Pow", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_114_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pow_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.2/Mul_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Sub_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Mul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.2/Add_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pow_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Mul_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Add_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_30", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_9_output_0", + "onnx::Unsqueeze_2561" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_30_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_31", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_10_output_0", + "onnx::Unsqueeze_2563" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_31_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_32", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Add_3_output_0", + "onnx::Unsqueeze_2565" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_32_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_30_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_31_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_32_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_17_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_3_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Concat_17_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_13_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_33", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_11_output_0", + "onnx::Unsqueeze_2569" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_33_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_33_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_115_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_116_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_117_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_118_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_119_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_18_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_34", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_11_output_0", + "onnx::Unsqueeze_2582" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_34_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_34_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_120_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_121_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_122_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_123_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_124_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_19_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_18_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_13_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_13_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_125_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_13_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_126_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Gather_13_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_19_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_8_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_4_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_20", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_8_output_0", + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_20_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_20_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_127_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_14_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_14_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_129_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_130_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_128_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_131_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.2/Transpose_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_7_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_7_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_132_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_15_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_9_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.2/Pad_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_13_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Cast_9_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_4_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.2/Mul_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_133_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Mul_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_35", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_9_output_0", + "onnx::Unsqueeze_2619" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_35_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_36", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_10_output_0", + "onnx::Unsqueeze_2621" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_36_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_37", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_11_output_0", + "onnx::Unsqueeze_2623" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_37_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_38", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Mul_4_output_0", + "onnx::Unsqueeze_2625" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_38_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_21", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_35_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_36_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_37_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_38_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_21_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_4_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Concat_21_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_16_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_16_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_135_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_136_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_134_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_137_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Shape_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_14_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.2/Gather_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Shape_14_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_138_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_14_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.2/Sub_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Constant_139_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Gather_14_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_10_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_5_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_22", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_10_output_0", + "/text_encoder/attn_encoder/attn_layers.2/ConstantOfShape_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_22_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_22_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_140_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_17_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_17_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_142_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_143_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_141_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_144_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.2/Transpose_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_8_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_8_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_145_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_18_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.2/Cast_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_18_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Cast_11_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.2/Pad_5", + "inputs": [ + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.emb_rel_v", + "/text_encoder/attn_encoder/attn_layers.2/Cast_11_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_5_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_39", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_147_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_39_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_40", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Sub_2_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_148_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_40_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.2/Slice_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Pad_5_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_39_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_40_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_146_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_149_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_41", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_10_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Constant_150_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_41_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.2/MatMul_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Slice_8_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_41_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/MatMul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.2/Add_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/MatMul_2_output_0", + "/text_encoder/attn_encoder/attn_layers.2/MatMul_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Add_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.2/Transpose_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Add_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_9_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_42", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_output_0", + "onnx::Unsqueeze_2674" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_42_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_43", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_1_output_0", + "onnx::Unsqueeze_2676" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_43_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_44", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Gather_3_output_0", + "onnx::Unsqueeze_2678" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_44_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.2/Concat_23", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_42_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_43_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Unsqueeze_44_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Concat_23_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.2/Reshape_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Transpose_9_output_0", + "/text_encoder/attn_encoder/attn_layers.2/Concat_23_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_19_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.2/conv_o/Conv", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.2/Reshape_19_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_o.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.2.conv_o.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.2/conv_o/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/Add_4", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.1/Transpose_1_output_0", + "/text_encoder/attn_encoder/attn_layers.2/conv_o/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Add_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_1.2/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/Add_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.2/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/attn_encoder/norm_layers_1.2/norm/LayerNormalization", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.2/Transpose_output_0", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.2.norm.weight", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.2.norm.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.2/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_1.2/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.2/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.2/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.2/Mul", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.2/Transpose_1_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/ffn_layers.2/conv_1/Conv", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/Mul_output_0", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.2.conv_1.weight", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.2.conv_1.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/conv_1/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Relu", + "name": "/text_encoder/attn_encoder/ffn_layers.2/Relu", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/conv_1/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/Relu_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.2/Mul_1", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/Relu_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/ffn_layers.2/conv_2/Conv", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/Mul_1_output_0", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.2.conv_2.weight", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.2.conv_2.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/conv_2/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.2/Mul_2", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/conv_2/Conv_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.2/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/Add_5", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.2/Transpose_1_output_0", + "/text_encoder/attn_encoder/ffn_layers.2/Mul_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Add_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_2.2/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/Add_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.2/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/attn_encoder/norm_layers_2.2/norm/LayerNormalization", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.2/Transpose_output_0", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.2.norm.weight", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.2.norm.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.2/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_2.2/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.2/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.2/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.3/conv_q/Conv", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.2/Transpose_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_q.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_q.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_q/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.3/conv_k/Conv", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.2/Transpose_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_k.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_k.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_k/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.3/conv_v/Conv", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.2/Transpose_1_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_v.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_v.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_v/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_1_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_k/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_2_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_2_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_q/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_3_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_3_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_output_0", + "onnx::Unsqueeze_2712" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_3_output_0", + "onnx::Unsqueeze_2718" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_4_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_5_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_q/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Concat_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.3/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_output_0", + "onnx::Unsqueeze_2723" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_2_output_0", + "onnx::Unsqueeze_2729" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_2_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_6_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_7_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_1_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_output_0", + "onnx::Unsqueeze_2732" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_2_output_0", + "onnx::Unsqueeze_2738" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_4_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_8_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_9_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_2_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_k/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Concat_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_1_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_v/Conv_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Concat_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_2_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.3/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Div", + "name": "/text_encoder/attn_encoder/attn_layers.3/Div", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.3/MatMul", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Div_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Reshape_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_2_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_11_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_output_0" + ], + "attrs": {} + }, + { + "op_type": "Clip", + "name": "/text_encoder/attn_encoder/attn_layers.3/Clip", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_12_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_13_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Gather_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Clip", + "name": "/text_encoder/attn_encoder/attn_layers.3/Clip_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_14_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.3/Mul", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_2_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.3/Add", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Mul_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Add_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_16_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_output_0", + "onnx::Unsqueeze_2768" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_output_0", + "onnx::Unsqueeze_2770" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_17_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_18_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_6_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_7_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_19_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_20_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_3_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_output_0", + "onnx::Unsqueeze_2781" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_output_0", + "onnx::Unsqueeze_2783" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_21_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_22_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_8_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_9_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_23_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_24_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_4_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_output_0", + "onnx::Unsqueeze_2794" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_output_0", + "onnx::Unsqueeze_2796" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_11_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_25_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_26_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_10_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_11_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_27_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_28_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_5_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_output_0", + "onnx::Unsqueeze_2807" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_12_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_output_0", + "onnx::Unsqueeze_2809" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_13_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_29_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_30_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_12_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_13_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_31_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_32_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_6_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_4_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_33_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_4_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_34_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Gather_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_output_0", + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_7_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_7_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_35_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_3_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_3_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_37_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_38_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_36_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_39_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.3/Transpose_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_2_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_2_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_40_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_4_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_1_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.3/Pad", + "inputs": [ + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.emb_rel_k", + "/text_encoder/attn_encoder/attn_layers.3/Cast_1_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_42_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_14_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_2_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_43_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_15_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_14_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_15_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_41_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_44_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_45_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_16_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.3/Transpose_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_16_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_3_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.3/MatMul_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Div_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Transpose_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/MatMul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_5_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_46_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_5_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_6_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_47_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_6_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/MatMul_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_7_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_48_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_7_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_49_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_1_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_50_output_0", + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_8_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_8_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_51_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_5_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_5_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_53_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_54_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_52_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_55_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.3/Transpose_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_4_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_4_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_56_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_6_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_2_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.3/Pad_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/MatMul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Cast_2_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_1_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.3/Mul_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_57_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.3/Mul_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Mul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Gather_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_5_output_0", + "onnx::Unsqueeze_2885" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_17_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_6_output_0", + "onnx::Unsqueeze_2887" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_18_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Mul_2_output_0", + "onnx::Unsqueeze_2889" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_19_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_17_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_18_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_19_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_9_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Concat_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_7_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_58_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_20", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_4_output_0", + "onnx::Unsqueeze_2897" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_20_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_59_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_20_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_60_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_61_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_62_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_63_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_10_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_21", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_4_output_0", + "onnx::Unsqueeze_2910" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_21_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_64_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_21_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_65_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_66_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_67_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_68_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_11_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_8_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_69_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_8_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_70_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Gather_8_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_11_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_3_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_2_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_3_output_0", + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_12_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_12_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_71_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_8_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_8_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_73_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_74_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_72_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_75_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.3/Transpose_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_5_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_5_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_76_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_9_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_4_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.3/Pad_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_7_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Cast_4_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_2_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.3/Add_1", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_77_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Add_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Mul_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_78_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_22", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_5_output_0", + "onnx::Unsqueeze_2947" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_22_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_23", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_6_output_0", + "onnx::Unsqueeze_2949" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_23_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_24", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Add_1_output_0", + "onnx::Unsqueeze_2951" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_24_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_25", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_6_output_0", + "onnx::Unsqueeze_2953" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_25_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_22_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_23_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_24_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_25_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_13_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_2_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Concat_13_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_10_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_26", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_7_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_81_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_26_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_10_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_80_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_26_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_79_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_82_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_27", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_4_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_84_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_27_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_4_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_27_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_85_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_83_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_86_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.3/Add_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/MatMul_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Slice_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Add_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.0/Equal_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_5_output_0" + ], + "attrs": { + "to": 9 + } + }, + { + "op_type": "Where", + "name": "/text_encoder/attn_encoder/attn_layers.3/Where", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_5_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_87_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Add_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Where_output_0" + ], + "attrs": {} + }, + { + "op_type": "Softmax", + "name": "/text_encoder/attn_encoder/attn_layers.3/Softmax", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Where_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Softmax_output_0" + ], + "attrs": { + "axis": -1 + } + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.3/MatMul_2", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Softmax_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Transpose_1_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/MatMul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_9_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_88_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_9_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_10_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_89_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_10_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Softmax_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_11_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_11_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_90_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_11_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_91_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_28", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_7_output_0", + "onnx::Unsqueeze_2994" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_28_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_92_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_28_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_93_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_94_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_95_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_96_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_97_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_98_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_14_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_29", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_7_output_0", + "onnx::Unsqueeze_3011" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_29_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_99_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_29_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_100_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_101_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_102_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_103_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_104_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_105_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_15_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_14_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_12_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_12_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_106_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_12_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_107_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Gather_12_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_6_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_8_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_3_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_6_output_0", + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_16_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_16_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_108_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_11_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_11_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_110_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_111_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_109_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_112_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.3/Transpose_6", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_6_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_12", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_6_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_113_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_12_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_12_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_7_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.3/Pad_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Softmax_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Cast_7_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_3_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Pow", + "name": "/text_encoder/attn_encoder/attn_layers.3/Pow", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_114_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pow_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.3/Mul_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Sub_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Mul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.3/Add_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pow_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Mul_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Add_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_30", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_9_output_0", + "onnx::Unsqueeze_3052" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_30_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_31", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_10_output_0", + "onnx::Unsqueeze_3054" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_31_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_32", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Add_3_output_0", + "onnx::Unsqueeze_3056" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_32_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_30_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_31_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_32_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_17_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_3_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Concat_17_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_13_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_33", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_11_output_0", + "onnx::Unsqueeze_3060" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_33_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_33_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_115_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_116_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_117_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_118_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_119_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_18_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_34", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_11_output_0", + "onnx::Unsqueeze_3073" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_34_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_34_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_120_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_121_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_122_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_123_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_124_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_19_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_18_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_13_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_13", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_13_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_125_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_13_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_126_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Gather_13_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_19_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_8_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_4_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_20", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_8_output_0", + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_20_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_20_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_127_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_14_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_14_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_129_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_130_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_128_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_131_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.3/Transpose_7", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_7_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_15", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_7_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_132_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_15_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_15_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_9_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.3/Pad_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_13_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Cast_9_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_4_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/attn_layers.3/Mul_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_11_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_133_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Mul_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_35", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_9_output_0", + "onnx::Unsqueeze_3110" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_35_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_36", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_10_output_0", + "onnx::Unsqueeze_3112" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_36_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_37", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_11_output_0", + "onnx::Unsqueeze_3114" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_37_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_38", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Mul_4_output_0", + "onnx::Unsqueeze_3116" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_38_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_21", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_35_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_36_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_37_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_38_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_21_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_16", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_4_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Concat_21_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_16_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_16_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_135_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_136_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_134_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_137_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_8_output_0" + ], + "attrs": {} + }, + { + "op_type": "Shape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Shape_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_14_output_0" + ], + "attrs": {} + }, + { + "op_type": "Gather", + "name": "/text_encoder/attn_encoder/attn_layers.3/Gather_14", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Shape_14_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_138_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_14_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Sub", + "name": "/text_encoder/attn_encoder/attn_layers.3/Sub_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Constant_139_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Gather_14_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_10_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "ConstantOfShape", + "name": "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_5", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_10_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_5_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 0 + ] + } + } + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_22", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_10_output_0", + "/text_encoder/attn_encoder/attn_layers.3/ConstantOfShape_5_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_22_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_17", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_22_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_140_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_17_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_17_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_142_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_143_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_141_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_144_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_9_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.3/Transpose_8", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_9_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_8_output_0" + ], + "attrs": { + "perm": [ + 1, + 0 + ] + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_18", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_8_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_145_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_18_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Cast", + "name": "/text_encoder/attn_encoder/attn_layers.3/Cast_11", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_18_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Cast_11_output_0" + ], + "attrs": { + "to": 7 + } + }, + { + "op_type": "Pad", + "name": "/text_encoder/attn_encoder/attn_layers.3/Pad_5", + "inputs": [ + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.emb_rel_v", + "/text_encoder/attn_encoder/attn_layers.3/Cast_11_output_0", + "" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_5_output_0" + ], + "attrs": { + "mode": "constant" + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_39", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Clip_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_147_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_39_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_40", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Sub_2_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_148_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_40_output_0" + ], + "attrs": {} + }, + { + "op_type": "Slice", + "name": "/text_encoder/attn_encoder/attn_layers.3/Slice_10", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Pad_5_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_39_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_40_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_146_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_149_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_10_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_41", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_10_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Constant_150_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_41_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/text_encoder/attn_encoder/attn_layers.3/MatMul_3", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Slice_8_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_41_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/MatMul_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/attn_layers.3/Add_4", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/MatMul_2_output_0", + "/text_encoder/attn_encoder/attn_layers.3/MatMul_3_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Add_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/attn_layers.3/Transpose_9", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Add_4_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_9_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_42", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_output_0", + "onnx::Unsqueeze_3165" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_42_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_43", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_1_output_0", + "onnx::Unsqueeze_3167" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_43_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_44", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Gather_3_output_0", + "onnx::Unsqueeze_3169" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_44_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/text_encoder/attn_encoder/attn_layers.3/Concat_23", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_42_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_43_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Unsqueeze_44_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Concat_23_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Reshape", + "name": "/text_encoder/attn_encoder/attn_layers.3/Reshape_19", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Transpose_9_output_0", + "/text_encoder/attn_encoder/attn_layers.3/Concat_23_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_19_output_0" + ], + "attrs": { + "allowzero": 0 + } + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/attn_layers.3/conv_o/Conv", + "inputs": [ + "/text_encoder/attn_encoder/attn_layers.3/Reshape_19_output_0", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_o.weight", + "tts.ttl.text_encoder.attn_encoder.attn_layers.3.conv_o.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/attn_layers.3/conv_o/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/Add_6", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.2/Transpose_1_output_0", + "/text_encoder/attn_encoder/attn_layers.3/conv_o/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Add_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_1.3/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/Add_6_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.3/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/attn_encoder/norm_layers_1.3/norm/LayerNormalization", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.3/Transpose_output_0", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.3.norm.weight", + "tts.ttl.text_encoder.attn_encoder.norm_layers_1.3.norm.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.3/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_1.3/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.3/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_1.3/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.3/Mul", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.3/Transpose_1_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/ffn_layers.3/conv_1/Conv", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/Mul_output_0", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.3.conv_1.weight", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.3.conv_1.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/conv_1/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Relu", + "name": "/text_encoder/attn_encoder/ffn_layers.3/Relu", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/conv_1/Conv_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/Relu_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.3/Mul_1", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/Relu_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/Mul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Conv", + "name": "/text_encoder/attn_encoder/ffn_layers.3/conv_2/Conv", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/Mul_1_output_0", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.3.conv_2.weight", + "tts.ttl.text_encoder.attn_encoder.ffn_layers.3.conv_2.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/conv_2/Conv_output_0" + ], + "attrs": { + "dilations": [ + 1 + ], + "group": 1, + "kernel_shape": [ + 1 + ], + "pads": [ + 0, + 0 + ], + "strides": [ + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/ffn_layers.3/Mul_2", + "inputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/conv_2/Conv_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/ffn_layers.3/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/attn_encoder/Add_7", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_1.3/Transpose_1_output_0", + "/text_encoder/attn_encoder/ffn_layers.3/Mul_2_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/Add_7_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_2.3/Transpose", + "inputs": [ + "/text_encoder/attn_encoder/Add_7_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.3/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "LayerNormalization", + "name": "/text_encoder/attn_encoder/norm_layers_2.3/norm/LayerNormalization", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.3/Transpose_output_0", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.3.norm.weight", + "tts.ttl.text_encoder.attn_encoder.norm_layers_2.3.norm.bias" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.3/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/text_encoder/attn_encoder/norm_layers_2.3/Transpose_1", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.3/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/text_encoder/attn_encoder/norm_layers_2.3/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/text_encoder/attn_encoder/Mul_2", + "inputs": [ + "/text_encoder/attn_encoder/norm_layers_2.3/Transpose_1_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/attn_encoder/Mul_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/text_encoder/Add", + "inputs": [ + "/text_encoder/attn_encoder/Mul_2_output_0", + "/text_encoder/convnext/convnext.5/Mul_3_output_0" + ], + "outputs": [ + "/text_encoder/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/text_encoder/proj_out/Mul", + "inputs": [ + "/text_encoder/Add_output_0", + "text_mask" + ], + "outputs": [ + "/text_encoder/proj_out/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "ConstantOfShape", + "name": "/ConstantOfShape", + "inputs": [ + "/Constant_output_0" + ], + "outputs": [ + "/ConstantOfShape_output_0" + ], + "attrs": { + "value": { + "dtype": "int64", + "shape": [ + 1 + ], + "data": [ + 1 + ] + } + } + }, + { + "op_type": "Expand", + "name": "/Expand", + "inputs": [ + "tts.ttl.style_encoder.style_token_layer.style_key", + "/ConstantOfShape_output_0" + ], + "outputs": [ + "/Expand_output_0" + ], + "attrs": {} + }, + { + "op_type": "Tile", + "name": "/Tile", + "inputs": [ + "/Expand_output_0", + "onnx::Tile_3191" + ], + "outputs": [ + "/Tile_output_0" + ], + "attrs": {} + }, + { + "op_type": "Transpose", + "name": "/speech_prompted_text_encoder/Transpose", + "inputs": [ + "/text_encoder/proj_out/Mul_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Transpose", + "name": "/speech_prompted_text_encoder/Transpose_1", + "inputs": [ + "text_mask" + ], + "outputs": [ + "/speech_prompted_text_encoder/Transpose_1_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention1/W_query/linear/MatMul", + "inputs": [ + "/speech_prompted_text_encoder/Transpose_output_0", + "onnx::MatMul_3680" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/W_query/linear/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/speech_prompted_text_encoder/attention1/W_query/linear/Add", + "inputs": [ + "tts.ttl.speech_prompted_text_encoder.attention1.W_query.linear.bias", + "/speech_prompted_text_encoder/attention1/W_query/linear/MatMul_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/W_query/linear/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention1/W_key/linear/MatMul", + "inputs": [ + "/Tile_output_0", + "onnx::MatMul_3681" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/W_key/linear/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/speech_prompted_text_encoder/attention1/W_key/linear/Add", + "inputs": [ + "tts.ttl.speech_prompted_text_encoder.attention1.W_key.linear.bias", + "/speech_prompted_text_encoder/attention1/W_key/linear/MatMul_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/W_key/linear/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention1/W_value/linear/MatMul", + "inputs": [ + "style_ttl", + "onnx::MatMul_3682" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/W_value/linear/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/speech_prompted_text_encoder/attention1/W_value/linear/Add", + "inputs": [ + "tts.ttl.speech_prompted_text_encoder.attention1.W_value.linear.bias", + "/speech_prompted_text_encoder/attention1/W_value/linear/MatMul_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/W_value/linear/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Split", + "name": "/speech_prompted_text_encoder/attention1/Split", + "inputs": [ + "/speech_prompted_text_encoder/attention1/W_query/linear/Add_output_0", + "/speech_prompted_text_encoder/attention1/Constant_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Split_output_0", + "/speech_prompted_text_encoder/attention1/Split_output_1" + ], + "attrs": { + "axis": 2 + } + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention1/Unsqueeze", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Split_output_0", + "/speech_prompted_text_encoder/attention1/Constant_1_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention1/Unsqueeze_1", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Split_output_1", + "/speech_prompted_text_encoder/attention1/Constant_2_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/speech_prompted_text_encoder/attention1/Concat", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_output_0", + "/speech_prompted_text_encoder/attention1/Unsqueeze_1_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Split", + "name": "/speech_prompted_text_encoder/attention1/Split_1", + "inputs": [ + "/speech_prompted_text_encoder/attention1/W_key/linear/Add_output_0", + "/speech_prompted_text_encoder/attention1/Constant_3_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Split_1_output_0", + "/speech_prompted_text_encoder/attention1/Split_1_output_1" + ], + "attrs": { + "axis": 2 + } + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention1/Unsqueeze_2", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Split_1_output_0", + "/speech_prompted_text_encoder/attention1/Constant_4_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention1/Unsqueeze_3", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Split_1_output_1", + "/speech_prompted_text_encoder/attention1/Constant_5_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/speech_prompted_text_encoder/attention1/Concat_1", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_2_output_0", + "/speech_prompted_text_encoder/attention1/Unsqueeze_3_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Concat_1_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Split", + "name": "/speech_prompted_text_encoder/attention1/Split_2", + "inputs": [ + "/speech_prompted_text_encoder/attention1/W_value/linear/Add_output_0", + "/speech_prompted_text_encoder/attention1/Constant_6_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Split_2_output_0", + "/speech_prompted_text_encoder/attention1/Split_2_output_1" + ], + "attrs": { + "axis": 2 + } + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention1/Unsqueeze_4", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Split_2_output_0", + "/speech_prompted_text_encoder/attention1/Constant_7_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention1/Unsqueeze_5", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Split_2_output_1", + "/speech_prompted_text_encoder/attention1/Constant_8_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/speech_prompted_text_encoder/attention1/Concat_2", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_4_output_0", + "/speech_prompted_text_encoder/attention1/Unsqueeze_5_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Concat_2_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Transpose", + "name": "/speech_prompted_text_encoder/attention1/Transpose", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Concat_1_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Tanh", + "name": "/speech_prompted_text_encoder/attention1/tanh/Tanh", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Transpose_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/tanh/Tanh_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention1/MatMul", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Concat_output_0", + "/speech_prompted_text_encoder/attention1/tanh/Tanh_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Div", + "name": "/speech_prompted_text_encoder/attention1/Div", + "inputs": [ + "/speech_prompted_text_encoder/attention1/MatMul_output_0", + "/speech_prompted_text_encoder/attention1/Constant_9_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "Softmax", + "name": "/speech_prompted_text_encoder/attention1/Softmax", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Div_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Softmax_output_0" + ], + "attrs": { + "axis": 3 + } + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention1/Unsqueeze_6", + "inputs": [ + "/speech_prompted_text_encoder/Transpose_1_output_0", + "/speech_prompted_text_encoder/attention1/Constant_10_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_6_output_0" + ], + "attrs": {} + }, + { + "op_type": "Equal", + "name": "/speech_prompted_text_encoder/attention1/Equal", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Unsqueeze_6_output_0", + "/speech_prompted_text_encoder/attention1/Constant_11_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Equal_output_0" + ], + "attrs": {} + }, + { + "op_type": "Cast", + "name": "/speech_prompted_text_encoder/attention1/Cast", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Equal_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Cast_output_0" + ], + "attrs": { + "to": 9 + } + }, + { + "op_type": "Where", + "name": "/speech_prompted_text_encoder/attention1/Where", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Cast_output_0", + "/speech_prompted_text_encoder/attention1/Constant_12_output_0", + "/speech_prompted_text_encoder/attention1/Softmax_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Where_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention1/MatMul_1", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Where_output_0", + "/speech_prompted_text_encoder/attention1/Concat_2_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/MatMul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Split", + "name": "/speech_prompted_text_encoder/attention1/Split_3", + "inputs": [ + "/speech_prompted_text_encoder/attention1/MatMul_1_output_0", + "/speech_prompted_text_encoder/attention1/Constant_13_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Split_3_output_0", + "/speech_prompted_text_encoder/attention1/Split_3_output_1" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Concat", + "name": "/speech_prompted_text_encoder/attention1/Concat_3", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Split_3_output_0", + "/speech_prompted_text_encoder/attention1/Split_3_output_1" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Concat_3_output_0" + ], + "attrs": { + "axis": 3 + } + }, + { + "op_type": "Squeeze", + "name": "/speech_prompted_text_encoder/attention1/Squeeze", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Concat_3_output_0", + "/speech_prompted_text_encoder/attention1/Constant_14_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Squeeze_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention1/out_fc/linear/MatMul", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Squeeze_output_0", + "onnx::MatMul_3683" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/out_fc/linear/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/speech_prompted_text_encoder/attention1/out_fc/linear/Add", + "inputs": [ + "tts.ttl.speech_prompted_text_encoder.attention1.out_fc.linear.bias", + "/speech_prompted_text_encoder/attention1/out_fc/linear/MatMul_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/out_fc/linear/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/speech_prompted_text_encoder/attention1/Mul", + "inputs": [ + "/speech_prompted_text_encoder/attention1/out_fc/linear/Add_output_0", + "/speech_prompted_text_encoder/Transpose_1_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention1/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/speech_prompted_text_encoder/Add", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Mul_output_0", + "/speech_prompted_text_encoder/Transpose_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention2/W_query/linear/MatMul", + "inputs": [ + "/speech_prompted_text_encoder/Add_output_0", + "onnx::MatMul_3684" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/W_query/linear/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/speech_prompted_text_encoder/attention2/W_query/linear/Add", + "inputs": [ + "tts.ttl.speech_prompted_text_encoder.attention2.W_query.linear.bias", + "/speech_prompted_text_encoder/attention2/W_query/linear/MatMul_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/W_query/linear/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention2/W_key/linear/MatMul", + "inputs": [ + "/Tile_output_0", + "onnx::MatMul_3685" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/W_key/linear/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/speech_prompted_text_encoder/attention2/W_key/linear/Add", + "inputs": [ + "tts.ttl.speech_prompted_text_encoder.attention2.W_key.linear.bias", + "/speech_prompted_text_encoder/attention2/W_key/linear/MatMul_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/W_key/linear/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention2/W_value/linear/MatMul", + "inputs": [ + "style_ttl", + "onnx::MatMul_3686" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/W_value/linear/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/speech_prompted_text_encoder/attention2/W_value/linear/Add", + "inputs": [ + "tts.ttl.speech_prompted_text_encoder.attention2.W_value.linear.bias", + "/speech_prompted_text_encoder/attention2/W_value/linear/MatMul_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/W_value/linear/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Split", + "name": "/speech_prompted_text_encoder/attention2/Split", + "inputs": [ + "/speech_prompted_text_encoder/attention2/W_query/linear/Add_output_0", + "/speech_prompted_text_encoder/attention2/Constant_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Split_output_0", + "/speech_prompted_text_encoder/attention2/Split_output_1" + ], + "attrs": { + "axis": 2 + } + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention2/Unsqueeze", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Split_output_0", + "/speech_prompted_text_encoder/attention2/Constant_1_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Unsqueeze_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention2/Unsqueeze_1", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Split_output_1", + "/speech_prompted_text_encoder/attention2/Constant_2_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Unsqueeze_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/speech_prompted_text_encoder/attention2/Concat", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Unsqueeze_output_0", + "/speech_prompted_text_encoder/attention2/Unsqueeze_1_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Concat_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Split", + "name": "/speech_prompted_text_encoder/attention2/Split_1", + "inputs": [ + "/speech_prompted_text_encoder/attention2/W_key/linear/Add_output_0", + "/speech_prompted_text_encoder/attention2/Constant_3_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Split_1_output_0", + "/speech_prompted_text_encoder/attention2/Split_1_output_1" + ], + "attrs": { + "axis": 2 + } + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention2/Unsqueeze_2", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Split_1_output_0", + "/speech_prompted_text_encoder/attention2/Constant_4_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Unsqueeze_2_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention2/Unsqueeze_3", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Split_1_output_1", + "/speech_prompted_text_encoder/attention2/Constant_5_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Unsqueeze_3_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/speech_prompted_text_encoder/attention2/Concat_1", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Unsqueeze_2_output_0", + "/speech_prompted_text_encoder/attention2/Unsqueeze_3_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Concat_1_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Split", + "name": "/speech_prompted_text_encoder/attention2/Split_2", + "inputs": [ + "/speech_prompted_text_encoder/attention2/W_value/linear/Add_output_0", + "/speech_prompted_text_encoder/attention2/Constant_6_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Split_2_output_0", + "/speech_prompted_text_encoder/attention2/Split_2_output_1" + ], + "attrs": { + "axis": 2 + } + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention2/Unsqueeze_4", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Split_2_output_0", + "/speech_prompted_text_encoder/attention2/Constant_7_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Unsqueeze_4_output_0" + ], + "attrs": {} + }, + { + "op_type": "Unsqueeze", + "name": "/speech_prompted_text_encoder/attention2/Unsqueeze_5", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Split_2_output_1", + "/speech_prompted_text_encoder/attention2/Constant_8_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Unsqueeze_5_output_0" + ], + "attrs": {} + }, + { + "op_type": "Concat", + "name": "/speech_prompted_text_encoder/attention2/Concat_2", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Unsqueeze_4_output_0", + "/speech_prompted_text_encoder/attention2/Unsqueeze_5_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Concat_2_output_0" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Transpose", + "name": "/speech_prompted_text_encoder/attention2/Transpose", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Concat_1_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 1, + 3, + 2 + ] + } + }, + { + "op_type": "Tanh", + "name": "/speech_prompted_text_encoder/attention2/tanh/Tanh", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Transpose_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/tanh/Tanh_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention2/MatMul", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Concat_output_0", + "/speech_prompted_text_encoder/attention2/tanh/Tanh_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Div", + "name": "/speech_prompted_text_encoder/attention2/Div", + "inputs": [ + "/speech_prompted_text_encoder/attention2/MatMul_output_0", + "/speech_prompted_text_encoder/attention2/Constant_9_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Div_output_0" + ], + "attrs": {} + }, + { + "op_type": "Softmax", + "name": "/speech_prompted_text_encoder/attention2/Softmax", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Div_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Softmax_output_0" + ], + "attrs": { + "axis": 3 + } + }, + { + "op_type": "Cast", + "name": "/speech_prompted_text_encoder/attention2/Cast", + "inputs": [ + "/speech_prompted_text_encoder/attention1/Equal_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Cast_output_0" + ], + "attrs": { + "to": 9 + } + }, + { + "op_type": "Where", + "name": "/speech_prompted_text_encoder/attention2/Where", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Cast_output_0", + "/speech_prompted_text_encoder/attention2/Constant_10_output_0", + "/speech_prompted_text_encoder/attention2/Softmax_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Where_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention2/MatMul_1", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Where_output_0", + "/speech_prompted_text_encoder/attention2/Concat_2_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/MatMul_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "Split", + "name": "/speech_prompted_text_encoder/attention2/Split_3", + "inputs": [ + "/speech_prompted_text_encoder/attention2/MatMul_1_output_0", + "/speech_prompted_text_encoder/attention2/Constant_11_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Split_3_output_0", + "/speech_prompted_text_encoder/attention2/Split_3_output_1" + ], + "attrs": { + "axis": 0 + } + }, + { + "op_type": "Concat", + "name": "/speech_prompted_text_encoder/attention2/Concat_3", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Split_3_output_0", + "/speech_prompted_text_encoder/attention2/Split_3_output_1" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Concat_3_output_0" + ], + "attrs": { + "axis": 3 + } + }, + { + "op_type": "Squeeze", + "name": "/speech_prompted_text_encoder/attention2/Squeeze", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Concat_3_output_0", + "/speech_prompted_text_encoder/attention2/Constant_12_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Squeeze_output_0" + ], + "attrs": {} + }, + { + "op_type": "MatMul", + "name": "/speech_prompted_text_encoder/attention2/out_fc/linear/MatMul", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Squeeze_output_0", + "onnx::MatMul_3687" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/out_fc/linear/MatMul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/speech_prompted_text_encoder/attention2/out_fc/linear/Add", + "inputs": [ + "tts.ttl.speech_prompted_text_encoder.attention2.out_fc.linear.bias", + "/speech_prompted_text_encoder/attention2/out_fc/linear/MatMul_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/out_fc/linear/Add_output_0" + ], + "attrs": {} + }, + { + "op_type": "Mul", + "name": "/speech_prompted_text_encoder/attention2/Mul", + "inputs": [ + "/speech_prompted_text_encoder/attention2/out_fc/linear/Add_output_0", + "/speech_prompted_text_encoder/Transpose_1_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/attention2/Mul_output_0" + ], + "attrs": {} + }, + { + "op_type": "Add", + "name": "/speech_prompted_text_encoder/Add_1", + "inputs": [ + "/speech_prompted_text_encoder/attention2/Mul_output_0", + "/speech_prompted_text_encoder/Transpose_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/Add_1_output_0" + ], + "attrs": {} + }, + { + "op_type": "LayerNormalization", + "name": "/speech_prompted_text_encoder/norm/norm/LayerNormalization", + "inputs": [ + "/speech_prompted_text_encoder/Add_1_output_0", + "tts.ttl.speech_prompted_text_encoder.norm.norm.weight", + "tts.ttl.speech_prompted_text_encoder.norm.norm.bias" + ], + "outputs": [ + "/speech_prompted_text_encoder/norm/norm/LayerNormalization_output_0" + ], + "attrs": { + "axis": -1, + "epsilon": 9.999999974752427e-07 + } + }, + { + "op_type": "Transpose", + "name": "/speech_prompted_text_encoder/norm/Transpose", + "inputs": [ + "/speech_prompted_text_encoder/norm/norm/LayerNormalization_output_0" + ], + "outputs": [ + "/speech_prompted_text_encoder/norm/Transpose_output_0" + ], + "attrs": { + "perm": [ + 0, + 2, + 1 + ] + } + }, + { + "op_type": "Mul", + "name": "/speech_prompted_text_encoder/Mul", + "inputs": [ + "/speech_prompted_text_encoder/norm/Transpose_output_0", + "text_mask" + ], + "outputs": [ + "text_emb" + ], + "attrs": {} + } + ] +} \ No newline at end of file