supertonic-3 / graphs /vocoder.json
ailuntz's picture
Add Supertonic 3 MLX metadata and graph topology
100bd71 verified
{
"ir_version": 9,
"opsets": [
{
"domain": "",
"version": 19
}
],
"inputs": [
"latent"
],
"outputs": [
"wav_tts"
],
"weight_map": {
"tts.ttl.normalizer.scale": "w000000",
"tts.ae.latent_mean": "w000001",
"tts.ae.latent_std": "w000002",
"tts.ae.decoder.convnext.0.gamma": "w000003",
"tts.ae.decoder.convnext.0.dwconv.net.weight": "w000004",
"tts.ae.decoder.convnext.0.dwconv.net.bias": "w000005",
"tts.ae.decoder.convnext.0.norm.norm.weight": "w000006",
"tts.ae.decoder.convnext.0.norm.norm.bias": "w000007",
"tts.ae.decoder.convnext.0.pwconv1.weight": "w000008",
"tts.ae.decoder.convnext.0.pwconv1.bias": "w000009",
"tts.ae.decoder.convnext.0.pwconv2.weight": "w000010",
"tts.ae.decoder.convnext.0.pwconv2.bias": "w000011",
"tts.ae.decoder.convnext.1.gamma": "w000012",
"tts.ae.decoder.convnext.1.dwconv.net.weight": "w000013",
"tts.ae.decoder.convnext.1.dwconv.net.bias": "w000014",
"tts.ae.decoder.convnext.1.norm.norm.weight": "w000015",
"tts.ae.decoder.convnext.1.norm.norm.bias": "w000016",
"tts.ae.decoder.convnext.1.pwconv1.weight": "w000017",
"tts.ae.decoder.convnext.1.pwconv1.bias": "w000018",
"tts.ae.decoder.convnext.1.pwconv2.weight": "w000019",
"tts.ae.decoder.convnext.1.pwconv2.bias": "w000020",
"tts.ae.decoder.convnext.2.gamma": "w000021",
"tts.ae.decoder.convnext.2.dwconv.net.weight": "w000022",
"tts.ae.decoder.convnext.2.dwconv.net.bias": "w000023",
"tts.ae.decoder.convnext.2.norm.norm.weight": "w000024",
"tts.ae.decoder.convnext.2.norm.norm.bias": "w000025",
"tts.ae.decoder.convnext.2.pwconv1.weight": "w000026",
"tts.ae.decoder.convnext.2.pwconv1.bias": "w000027",
"tts.ae.decoder.convnext.2.pwconv2.weight": "w000028",
"tts.ae.decoder.convnext.2.pwconv2.bias": "w000029",
"tts.ae.decoder.convnext.3.gamma": "w000030",
"tts.ae.decoder.convnext.3.dwconv.net.weight": "w000031",
"tts.ae.decoder.convnext.3.dwconv.net.bias": "w000032",
"tts.ae.decoder.convnext.3.norm.norm.weight": "w000033",
"tts.ae.decoder.convnext.3.norm.norm.bias": "w000034",
"tts.ae.decoder.convnext.3.pwconv1.weight": "w000035",
"tts.ae.decoder.convnext.3.pwconv1.bias": "w000036",
"tts.ae.decoder.convnext.3.pwconv2.weight": "w000037",
"tts.ae.decoder.convnext.3.pwconv2.bias": "w000038",
"tts.ae.decoder.convnext.4.gamma": "w000039",
"tts.ae.decoder.convnext.4.dwconv.net.weight": "w000040",
"tts.ae.decoder.convnext.4.dwconv.net.bias": "w000041",
"tts.ae.decoder.convnext.4.norm.norm.weight": "w000042",
"tts.ae.decoder.convnext.4.norm.norm.bias": "w000043",
"tts.ae.decoder.convnext.4.pwconv1.weight": "w000044",
"tts.ae.decoder.convnext.4.pwconv1.bias": "w000045",
"tts.ae.decoder.convnext.4.pwconv2.weight": "w000046",
"tts.ae.decoder.convnext.4.pwconv2.bias": "w000047",
"tts.ae.decoder.convnext.5.gamma": "w000048",
"tts.ae.decoder.convnext.5.dwconv.net.weight": "w000049",
"tts.ae.decoder.convnext.5.dwconv.net.bias": "w000050",
"tts.ae.decoder.convnext.5.norm.norm.weight": "w000051",
"tts.ae.decoder.convnext.5.norm.norm.bias": "w000052",
"tts.ae.decoder.convnext.5.pwconv1.weight": "w000053",
"tts.ae.decoder.convnext.5.pwconv1.bias": "w000054",
"tts.ae.decoder.convnext.5.pwconv2.weight": "w000055",
"tts.ae.decoder.convnext.5.pwconv2.bias": "w000056",
"tts.ae.decoder.convnext.6.gamma": "w000057",
"tts.ae.decoder.convnext.6.dwconv.net.weight": "w000058",
"tts.ae.decoder.convnext.6.dwconv.net.bias": "w000059",
"tts.ae.decoder.convnext.6.norm.norm.weight": "w000060",
"tts.ae.decoder.convnext.6.norm.norm.bias": "w000061",
"tts.ae.decoder.convnext.6.pwconv1.weight": "w000062",
"tts.ae.decoder.convnext.6.pwconv1.bias": "w000063",
"tts.ae.decoder.convnext.6.pwconv2.weight": "w000064",
"tts.ae.decoder.convnext.6.pwconv2.bias": "w000065",
"tts.ae.decoder.convnext.7.gamma": "w000066",
"tts.ae.decoder.convnext.7.dwconv.net.weight": "w000067",
"tts.ae.decoder.convnext.7.dwconv.net.bias": "w000068",
"tts.ae.decoder.convnext.7.norm.norm.weight": "w000069",
"tts.ae.decoder.convnext.7.norm.norm.bias": "w000070",
"tts.ae.decoder.convnext.7.pwconv1.weight": "w000071",
"tts.ae.decoder.convnext.7.pwconv1.bias": "w000072",
"tts.ae.decoder.convnext.7.pwconv2.weight": "w000073",
"tts.ae.decoder.convnext.7.pwconv2.bias": "w000074",
"tts.ae.decoder.convnext.8.gamma": "w000075",
"tts.ae.decoder.convnext.8.dwconv.net.weight": "w000076",
"tts.ae.decoder.convnext.8.dwconv.net.bias": "w000077",
"tts.ae.decoder.convnext.8.norm.norm.weight": "w000078",
"tts.ae.decoder.convnext.8.norm.norm.bias": "w000079",
"tts.ae.decoder.convnext.8.pwconv1.weight": "w000080",
"tts.ae.decoder.convnext.8.pwconv1.bias": "w000081",
"tts.ae.decoder.convnext.8.pwconv2.weight": "w000082",
"tts.ae.decoder.convnext.8.pwconv2.bias": "w000083",
"tts.ae.decoder.convnext.9.gamma": "w000084",
"tts.ae.decoder.convnext.9.dwconv.net.weight": "w000085",
"tts.ae.decoder.convnext.9.dwconv.net.bias": "w000086",
"tts.ae.decoder.convnext.9.norm.norm.weight": "w000087",
"tts.ae.decoder.convnext.9.norm.norm.bias": "w000088",
"tts.ae.decoder.convnext.9.pwconv1.weight": "w000089",
"tts.ae.decoder.convnext.9.pwconv1.bias": "w000090",
"tts.ae.decoder.convnext.9.pwconv2.weight": "w000091",
"tts.ae.decoder.convnext.9.pwconv2.bias": "w000092",
"tts.ae.decoder.final_norm.norm.weight": "w000093",
"tts.ae.decoder.final_norm.norm.bias": "w000094",
"tts.ae.decoder.final_norm.norm.running_mean": "w000095",
"tts.ae.decoder.final_norm.norm.running_var": "w000096",
"tts.ae.decoder.head.layer1.net.weight": "w000097",
"tts.ae.decoder.head.layer1.net.bias": "w000098",
"tts.ae.decoder.head.layer2.weight": "w000099",
"onnx::Conv_1441": "w000100",
"onnx::Conv_1442": "w000101",
"onnx::PRelu_1506": "w000102",
"/Constant_output_0": "c000000",
"/Constant_1_output_0": "c000001",
"/Constant_2_output_0": "c000002",
"/Constant_3_output_0": "c000003",
"/Constant_4_output_0": "c000004",
"onnx::Unsqueeze_967": "c000005",
"/Constant_5_output_0": "c000006",
"/Constant_6_output_0": "c000007",
"onnx::Unsqueeze_973": "c000008",
"/Constant_7_output_0": "c000009",
"/Constant_8_output_0": "c000010",
"onnx::Unsqueeze_984": "c000011",
"onnx::Unsqueeze_986": "c000012",
"/Constant_9_output_0": "c000013",
"/decoder/embed/Constant_output_0": "c000014",
"/decoder/embed/Constant_1_output_0": "c000015",
"/decoder/embed/Constant_2_output_0": "c000016",
"/decoder/embed/Constant_3_output_0": "c000017",
"/decoder/embed/Constant_4_output_0": "c000018",
"/decoder/embed/Constant_5_output_0": "c000019",
"/decoder/embed/Constant_6_output_0": "c000020",
"/decoder/embed/Constant_7_output_0": "c000021",
"/decoder/convnext.0/dwconv/Constant_output_0": "c000022",
"/decoder/convnext.0/dwconv/Constant_1_output_0": "c000023",
"/decoder/convnext.0/dwconv/Constant_2_output_0": "c000024",
"/decoder/convnext.0/dwconv/Constant_3_output_0": "c000025",
"/decoder/convnext.0/dwconv/Constant_4_output_0": "c000026",
"/decoder/convnext.0/dwconv/Constant_5_output_0": "c000027",
"/decoder/convnext.0/dwconv/Constant_6_output_0": "c000028",
"/decoder/convnext.0/dwconv/Constant_7_output_0": "c000029",
"/decoder/convnext.0/act/Constant_output_0": "c000030",
"/decoder/convnext.0/act/Constant_1_output_0": "c000031",
"/decoder/convnext.0/act/Constant_2_output_0": "c000032",
"/decoder/convnext.1/dwconv/Constant_output_0": "c000033",
"/decoder/convnext.1/dwconv/Constant_1_output_0": "c000034",
"/decoder/convnext.1/dwconv/Constant_2_output_0": "c000035",
"/decoder/convnext.1/dwconv/Constant_3_output_0": "c000036",
"/decoder/convnext.1/dwconv/Constant_4_output_0": "c000037",
"/decoder/convnext.1/dwconv/Constant_5_output_0": "c000038",
"/decoder/convnext.1/dwconv/Constant_6_output_0": "c000039",
"/decoder/convnext.1/dwconv/Constant_7_output_0": "c000040",
"/decoder/convnext.1/act/Constant_output_0": "c000041",
"/decoder/convnext.1/act/Constant_1_output_0": "c000042",
"/decoder/convnext.1/act/Constant_2_output_0": "c000043",
"/decoder/convnext.2/dwconv/Constant_output_0": "c000044",
"/decoder/convnext.2/dwconv/Constant_1_output_0": "c000045",
"/decoder/convnext.2/dwconv/Constant_2_output_0": "c000046",
"/decoder/convnext.2/dwconv/Constant_3_output_0": "c000047",
"/decoder/convnext.2/dwconv/Constant_4_output_0": "c000048",
"/decoder/convnext.2/dwconv/Constant_5_output_0": "c000049",
"/decoder/convnext.2/dwconv/Constant_6_output_0": "c000050",
"/decoder/convnext.2/dwconv/Constant_7_output_0": "c000051",
"/decoder/convnext.2/act/Constant_output_0": "c000052",
"/decoder/convnext.2/act/Constant_1_output_0": "c000053",
"/decoder/convnext.2/act/Constant_2_output_0": "c000054",
"/decoder/convnext.3/dwconv/Constant_output_0": "c000055",
"/decoder/convnext.3/dwconv/Constant_1_output_0": "c000056",
"/decoder/convnext.3/dwconv/Constant_2_output_0": "c000057",
"/decoder/convnext.3/dwconv/Constant_3_output_0": "c000058",
"/decoder/convnext.3/dwconv/Constant_4_output_0": "c000059",
"/decoder/convnext.3/dwconv/Constant_5_output_0": "c000060",
"/decoder/convnext.3/dwconv/Constant_6_output_0": "c000061",
"/decoder/convnext.3/dwconv/Constant_7_output_0": "c000062",
"/decoder/convnext.3/act/Constant_output_0": "c000063",
"/decoder/convnext.3/act/Constant_1_output_0": "c000064",
"/decoder/convnext.3/act/Constant_2_output_0": "c000065",
"/decoder/convnext.4/dwconv/Constant_output_0": "c000066",
"/decoder/convnext.4/dwconv/Constant_1_output_0": "c000067",
"/decoder/convnext.4/dwconv/Constant_2_output_0": "c000068",
"/decoder/convnext.4/dwconv/Constant_3_output_0": "c000069",
"/decoder/convnext.4/dwconv/Constant_4_output_0": "c000070",
"/decoder/convnext.4/dwconv/Constant_5_output_0": "c000071",
"/decoder/convnext.4/dwconv/Constant_6_output_0": "c000072",
"/decoder/convnext.4/dwconv/Constant_7_output_0": "c000073",
"/decoder/convnext.4/act/Constant_output_0": "c000074",
"/decoder/convnext.4/act/Constant_1_output_0": "c000075",
"/decoder/convnext.4/act/Constant_2_output_0": "c000076",
"/decoder/convnext.5/dwconv/Constant_output_0": "c000077",
"/decoder/convnext.5/dwconv/Constant_1_output_0": "c000078",
"/decoder/convnext.5/dwconv/Constant_2_output_0": "c000079",
"/decoder/convnext.5/dwconv/Constant_3_output_0": "c000080",
"/decoder/convnext.5/dwconv/Constant_4_output_0": "c000081",
"/decoder/convnext.5/dwconv/Constant_5_output_0": "c000082",
"/decoder/convnext.5/dwconv/Constant_6_output_0": "c000083",
"/decoder/convnext.5/dwconv/Constant_7_output_0": "c000084",
"/decoder/convnext.5/act/Constant_output_0": "c000085",
"/decoder/convnext.5/act/Constant_1_output_0": "c000086",
"/decoder/convnext.5/act/Constant_2_output_0": "c000087",
"/decoder/convnext.6/dwconv/Constant_output_0": "c000088",
"/decoder/convnext.6/dwconv/Constant_1_output_0": "c000089",
"/decoder/convnext.6/dwconv/Constant_2_output_0": "c000090",
"/decoder/convnext.6/dwconv/Constant_3_output_0": "c000091",
"/decoder/convnext.6/dwconv/Constant_4_output_0": "c000092",
"/decoder/convnext.6/dwconv/Constant_5_output_0": "c000093",
"/decoder/convnext.6/dwconv/Constant_6_output_0": "c000094",
"/decoder/convnext.6/dwconv/Constant_7_output_0": "c000095",
"/decoder/convnext.6/act/Constant_output_0": "c000096",
"/decoder/convnext.6/act/Constant_1_output_0": "c000097",
"/decoder/convnext.6/act/Constant_2_output_0": "c000098",
"/decoder/convnext.7/dwconv/Constant_output_0": "c000099",
"/decoder/convnext.7/dwconv/Constant_1_output_0": "c000100",
"/decoder/convnext.7/dwconv/Constant_2_output_0": "c000101",
"/decoder/convnext.7/dwconv/Constant_3_output_0": "c000102",
"/decoder/convnext.7/dwconv/Constant_4_output_0": "c000103",
"/decoder/convnext.7/dwconv/Constant_5_output_0": "c000104",
"/decoder/convnext.7/dwconv/Constant_6_output_0": "c000105",
"/decoder/convnext.7/dwconv/Constant_7_output_0": "c000106",
"/decoder/convnext.7/act/Constant_output_0": "c000107",
"/decoder/convnext.7/act/Constant_1_output_0": "c000108",
"/decoder/convnext.7/act/Constant_2_output_0": "c000109",
"/decoder/convnext.8/dwconv/Constant_output_0": "c000110",
"/decoder/convnext.8/dwconv/Constant_1_output_0": "c000111",
"/decoder/convnext.8/dwconv/Constant_2_output_0": "c000112",
"/decoder/convnext.8/dwconv/Constant_3_output_0": "c000113",
"/decoder/convnext.8/dwconv/Constant_4_output_0": "c000114",
"/decoder/convnext.8/dwconv/Constant_5_output_0": "c000115",
"/decoder/convnext.8/dwconv/Constant_6_output_0": "c000116",
"/decoder/convnext.8/dwconv/Constant_7_output_0": "c000117",
"/decoder/convnext.8/act/Constant_output_0": "c000118",
"/decoder/convnext.8/act/Constant_1_output_0": "c000119",
"/decoder/convnext.8/act/Constant_2_output_0": "c000120",
"/decoder/convnext.9/dwconv/Constant_output_0": "c000121",
"/decoder/convnext.9/dwconv/Constant_1_output_0": "c000122",
"/decoder/convnext.9/dwconv/Constant_2_output_0": "c000123",
"/decoder/convnext.9/dwconv/Constant_3_output_0": "c000124",
"/decoder/convnext.9/dwconv/Constant_4_output_0": "c000125",
"/decoder/convnext.9/dwconv/Constant_5_output_0": "c000126",
"/decoder/convnext.9/dwconv/Constant_6_output_0": "c000127",
"/decoder/convnext.9/dwconv/Constant_7_output_0": "c000128",
"/decoder/convnext.9/act/Constant_output_0": "c000129",
"/decoder/convnext.9/act/Constant_1_output_0": "c000130",
"/decoder/convnext.9/act/Constant_2_output_0": "c000131",
"/decoder/head/layer1/Constant_output_0": "c000132",
"/decoder/head/layer1/Constant_1_output_0": "c000133",
"/decoder/head/layer1/Constant_2_output_0": "c000134",
"/decoder/head/layer1/Constant_3_output_0": "c000135",
"/decoder/head/layer1/Constant_4_output_0": "c000136",
"/decoder/head/layer1/Constant_5_output_0": "c000137",
"/decoder/head/layer1/Constant_6_output_0": "c000138",
"/decoder/head/layer1/Constant_7_output_0": "c000139",
"/decoder/head/Constant_output_0": "c000140",
"onnx::Unsqueeze_1434": "c000141",
"/decoder/head/Constant_1_output_0": "c000142"
},
"nodes": [
{
"op_type": "Div",
"name": "/Div",
"inputs": [
"latent",
"tts.ttl.normalizer.scale"
],
"outputs": [
"/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Shape",
"name": "/Shape",
"inputs": [
"/Div_output_0"
],
"outputs": [
"/Shape_output_0"
],
"attrs": {}
},
{
"op_type": "Gather",
"name": "/Gather",
"inputs": [
"/Shape_output_0",
"/Constant_output_0"
],
"outputs": [
"/Gather_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Shape",
"name": "/Shape_1",
"inputs": [
"/Div_output_0"
],
"outputs": [
"/Shape_1_output_0"
],
"attrs": {}
},
{
"op_type": "Slice",
"name": "/Slice",
"inputs": [
"/Shape_1_output_0",
"/Constant_2_output_0",
"/Constant_3_output_0",
"/Constant_1_output_0"
],
"outputs": [
"/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Squeeze",
"name": "/Squeeze",
"inputs": [
"/Slice_output_0",
"/Constant_4_output_0"
],
"outputs": [
"/Squeeze_output_0"
],
"attrs": {}
},
{
"op_type": "Unsqueeze",
"name": "/Unsqueeze",
"inputs": [
"/Gather_output_0",
"onnx::Unsqueeze_967"
],
"outputs": [
"/Unsqueeze_output_0"
],
"attrs": {}
},
{
"op_type": "Unsqueeze",
"name": "/Unsqueeze_1",
"inputs": [
"/Squeeze_output_0",
"onnx::Unsqueeze_973"
],
"outputs": [
"/Unsqueeze_1_output_0"
],
"attrs": {}
},
{
"op_type": "Concat",
"name": "/Concat",
"inputs": [
"/Unsqueeze_output_0",
"/Constant_5_output_0",
"/Constant_6_output_0",
"/Unsqueeze_1_output_0"
],
"outputs": [
"/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/Reshape",
"inputs": [
"/Div_output_0",
"/Concat_output_0"
],
"outputs": [
"/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Transpose",
"name": "/Transpose",
"inputs": [
"/Reshape_output_0"
],
"outputs": [
"/Transpose_output_0"
],
"attrs": {
"perm": [
0,
1,
3,
2
]
}
},
{
"op_type": "Shape",
"name": "/Shape_2",
"inputs": [
"/Transpose_output_0"
],
"outputs": [
"/Shape_2_output_0"
],
"attrs": {}
},
{
"op_type": "Gather",
"name": "/Gather_1",
"inputs": [
"/Shape_2_output_0",
"/Constant_7_output_0"
],
"outputs": [
"/Gather_1_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Shape",
"name": "/Shape_3",
"inputs": [
"/Transpose_output_0"
],
"outputs": [
"/Shape_3_output_0"
],
"attrs": {}
},
{
"op_type": "Gather",
"name": "/Gather_2",
"inputs": [
"/Shape_3_output_0",
"/Constant_8_output_0"
],
"outputs": [
"/Gather_2_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Unsqueeze",
"name": "/Unsqueeze_2",
"inputs": [
"/Gather_1_output_0",
"onnx::Unsqueeze_984"
],
"outputs": [
"/Unsqueeze_2_output_0"
],
"attrs": {}
},
{
"op_type": "Unsqueeze",
"name": "/Unsqueeze_3",
"inputs": [
"/Gather_2_output_0",
"onnx::Unsqueeze_986"
],
"outputs": [
"/Unsqueeze_3_output_0"
],
"attrs": {}
},
{
"op_type": "Concat",
"name": "/Concat_1",
"inputs": [
"/Unsqueeze_2_output_0",
"/Unsqueeze_3_output_0",
"/Constant_9_output_0"
],
"outputs": [
"/Concat_1_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/Reshape_1",
"inputs": [
"/Transpose_output_0",
"/Concat_1_output_0"
],
"outputs": [
"/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Mul",
"name": "/Mul",
"inputs": [
"/Reshape_1_output_0",
"tts.ae.latent_std"
],
"outputs": [
"/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/Add",
"inputs": [
"/Mul_output_0",
"tts.ae.latent_mean"
],
"outputs": [
"/Add_output_0"
],
"attrs": {}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/embed/ConstantOfShape",
"inputs": [
"/decoder/embed/Constant_output_0"
],
"outputs": [
"/decoder/embed/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/embed/Concat",
"inputs": [
"/decoder/embed/Constant_1_output_0",
"/decoder/embed/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/embed/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/embed/Reshape",
"inputs": [
"/decoder/embed/Concat_output_0",
"/decoder/embed/Constant_2_output_0"
],
"outputs": [
"/decoder/embed/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/embed/Slice",
"inputs": [
"/decoder/embed/Reshape_output_0",
"/decoder/embed/Constant_4_output_0",
"/decoder/embed/Constant_5_output_0",
"/decoder/embed/Constant_3_output_0",
"/decoder/embed/Constant_6_output_0"
],
"outputs": [
"/decoder/embed/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/embed/Transpose",
"inputs": [
"/decoder/embed/Slice_output_0"
],
"outputs": [
"/decoder/embed/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/embed/Reshape_1",
"inputs": [
"/decoder/embed/Transpose_output_0",
"/decoder/embed/Constant_7_output_0"
],
"outputs": [
"/decoder/embed/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/embed/Cast",
"inputs": [
"/decoder/embed/Reshape_1_output_0"
],
"outputs": [
"/decoder/embed/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/embed/Pad",
"inputs": [
"/Add_output_0",
"/decoder/embed/Cast_output_0"
],
"outputs": [
"/decoder/embed/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/embed/net/Conv",
"inputs": [
"/decoder/embed/Pad_output_0",
"onnx::Conv_1441",
"onnx::Conv_1442"
],
"outputs": [
"/decoder/embed/net/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/convnext.0/dwconv/ConstantOfShape",
"inputs": [
"/decoder/convnext.0/dwconv/Constant_output_0"
],
"outputs": [
"/decoder/convnext.0/dwconv/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/convnext.0/dwconv/Concat",
"inputs": [
"/decoder/convnext.0/dwconv/Constant_1_output_0",
"/decoder/convnext.0/dwconv/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/convnext.0/dwconv/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.0/dwconv/Reshape",
"inputs": [
"/decoder/convnext.0/dwconv/Concat_output_0",
"/decoder/convnext.0/dwconv/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.0/dwconv/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/convnext.0/dwconv/Slice",
"inputs": [
"/decoder/convnext.0/dwconv/Reshape_output_0",
"/decoder/convnext.0/dwconv/Constant_4_output_0",
"/decoder/convnext.0/dwconv/Constant_5_output_0",
"/decoder/convnext.0/dwconv/Constant_3_output_0",
"/decoder/convnext.0/dwconv/Constant_6_output_0"
],
"outputs": [
"/decoder/convnext.0/dwconv/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.0/dwconv/Transpose",
"inputs": [
"/decoder/convnext.0/dwconv/Slice_output_0"
],
"outputs": [
"/decoder/convnext.0/dwconv/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.0/dwconv/Reshape_1",
"inputs": [
"/decoder/convnext.0/dwconv/Transpose_output_0",
"/decoder/convnext.0/dwconv/Constant_7_output_0"
],
"outputs": [
"/decoder/convnext.0/dwconv/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/convnext.0/dwconv/Cast",
"inputs": [
"/decoder/convnext.0/dwconv/Reshape_1_output_0"
],
"outputs": [
"/decoder/convnext.0/dwconv/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/convnext.0/dwconv/Pad",
"inputs": [
"/decoder/embed/net/Conv_output_0",
"/decoder/convnext.0/dwconv/Cast_output_0"
],
"outputs": [
"/decoder/convnext.0/dwconv/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.0/dwconv/net/Conv",
"inputs": [
"/decoder/convnext.0/dwconv/Pad_output_0",
"tts.ae.decoder.convnext.0.dwconv.net.weight",
"tts.ae.decoder.convnext.0.dwconv.net.bias"
],
"outputs": [
"/decoder/convnext.0/dwconv/net/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 512,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.0/norm/Transpose",
"inputs": [
"/decoder/convnext.0/dwconv/net/Conv_output_0"
],
"outputs": [
"/decoder/convnext.0/norm/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "LayerNormalization",
"name": "/decoder/convnext.0/norm/norm/LayerNormalization",
"inputs": [
"/decoder/convnext.0/norm/Transpose_output_0",
"tts.ae.decoder.convnext.0.norm.norm.weight",
"tts.ae.decoder.convnext.0.norm.norm.bias"
],
"outputs": [
"/decoder/convnext.0/norm/norm/LayerNormalization_output_0"
],
"attrs": {
"axis": -1,
"epsilon": 9.999999974752427e-07
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.0/norm/Transpose_1",
"inputs": [
"/decoder/convnext.0/norm/norm/LayerNormalization_output_0"
],
"outputs": [
"/decoder/convnext.0/norm/Transpose_1_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.0/pwconv1/Conv",
"inputs": [
"/decoder/convnext.0/norm/Transpose_1_output_0",
"tts.ae.decoder.convnext.0.pwconv1.weight",
"tts.ae.decoder.convnext.0.pwconv1.bias"
],
"outputs": [
"/decoder/convnext.0/pwconv1/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Div",
"name": "/decoder/convnext.0/act/Div",
"inputs": [
"/decoder/convnext.0/pwconv1/Conv_output_0",
"/decoder/convnext.0/act/Constant_output_0"
],
"outputs": [
"/decoder/convnext.0/act/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Erf",
"name": "/decoder/convnext.0/act/Erf",
"inputs": [
"/decoder/convnext.0/act/Div_output_0"
],
"outputs": [
"/decoder/convnext.0/act/Erf_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.0/act/Add",
"inputs": [
"/decoder/convnext.0/act/Erf_output_0",
"/decoder/convnext.0/act/Constant_1_output_0"
],
"outputs": [
"/decoder/convnext.0/act/Add_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.0/act/Mul",
"inputs": [
"/decoder/convnext.0/pwconv1/Conv_output_0",
"/decoder/convnext.0/act/Add_output_0"
],
"outputs": [
"/decoder/convnext.0/act/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.0/act/Mul_1",
"inputs": [
"/decoder/convnext.0/act/Mul_output_0",
"/decoder/convnext.0/act/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.0/act/Mul_1_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.0/pwconv2/Conv",
"inputs": [
"/decoder/convnext.0/act/Mul_1_output_0",
"tts.ae.decoder.convnext.0.pwconv2.weight",
"tts.ae.decoder.convnext.0.pwconv2.bias"
],
"outputs": [
"/decoder/convnext.0/pwconv2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.0/Mul",
"inputs": [
"tts.ae.decoder.convnext.0.gamma",
"/decoder/convnext.0/pwconv2/Conv_output_0"
],
"outputs": [
"/decoder/convnext.0/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.0/Add",
"inputs": [
"/decoder/embed/net/Conv_output_0",
"/decoder/convnext.0/Mul_output_0"
],
"outputs": [
"/decoder/convnext.0/Add_output_0"
],
"attrs": {}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/convnext.1/dwconv/ConstantOfShape",
"inputs": [
"/decoder/convnext.1/dwconv/Constant_output_0"
],
"outputs": [
"/decoder/convnext.1/dwconv/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/convnext.1/dwconv/Concat",
"inputs": [
"/decoder/convnext.1/dwconv/Constant_1_output_0",
"/decoder/convnext.1/dwconv/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/convnext.1/dwconv/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.1/dwconv/Reshape",
"inputs": [
"/decoder/convnext.1/dwconv/Concat_output_0",
"/decoder/convnext.1/dwconv/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.1/dwconv/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/convnext.1/dwconv/Slice",
"inputs": [
"/decoder/convnext.1/dwconv/Reshape_output_0",
"/decoder/convnext.1/dwconv/Constant_4_output_0",
"/decoder/convnext.1/dwconv/Constant_5_output_0",
"/decoder/convnext.1/dwconv/Constant_3_output_0",
"/decoder/convnext.1/dwconv/Constant_6_output_0"
],
"outputs": [
"/decoder/convnext.1/dwconv/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.1/dwconv/Transpose",
"inputs": [
"/decoder/convnext.1/dwconv/Slice_output_0"
],
"outputs": [
"/decoder/convnext.1/dwconv/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.1/dwconv/Reshape_1",
"inputs": [
"/decoder/convnext.1/dwconv/Transpose_output_0",
"/decoder/convnext.1/dwconv/Constant_7_output_0"
],
"outputs": [
"/decoder/convnext.1/dwconv/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/convnext.1/dwconv/Cast",
"inputs": [
"/decoder/convnext.1/dwconv/Reshape_1_output_0"
],
"outputs": [
"/decoder/convnext.1/dwconv/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/convnext.1/dwconv/Pad",
"inputs": [
"/decoder/convnext.0/Add_output_0",
"/decoder/convnext.1/dwconv/Cast_output_0"
],
"outputs": [
"/decoder/convnext.1/dwconv/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.1/dwconv/net/Conv",
"inputs": [
"/decoder/convnext.1/dwconv/Pad_output_0",
"tts.ae.decoder.convnext.1.dwconv.net.weight",
"tts.ae.decoder.convnext.1.dwconv.net.bias"
],
"outputs": [
"/decoder/convnext.1/dwconv/net/Conv_output_0"
],
"attrs": {
"dilations": [
2
],
"group": 512,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.1/norm/Transpose",
"inputs": [
"/decoder/convnext.1/dwconv/net/Conv_output_0"
],
"outputs": [
"/decoder/convnext.1/norm/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "LayerNormalization",
"name": "/decoder/convnext.1/norm/norm/LayerNormalization",
"inputs": [
"/decoder/convnext.1/norm/Transpose_output_0",
"tts.ae.decoder.convnext.1.norm.norm.weight",
"tts.ae.decoder.convnext.1.norm.norm.bias"
],
"outputs": [
"/decoder/convnext.1/norm/norm/LayerNormalization_output_0"
],
"attrs": {
"axis": -1,
"epsilon": 9.999999974752427e-07
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.1/norm/Transpose_1",
"inputs": [
"/decoder/convnext.1/norm/norm/LayerNormalization_output_0"
],
"outputs": [
"/decoder/convnext.1/norm/Transpose_1_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.1/pwconv1/Conv",
"inputs": [
"/decoder/convnext.1/norm/Transpose_1_output_0",
"tts.ae.decoder.convnext.1.pwconv1.weight",
"tts.ae.decoder.convnext.1.pwconv1.bias"
],
"outputs": [
"/decoder/convnext.1/pwconv1/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Div",
"name": "/decoder/convnext.1/act/Div",
"inputs": [
"/decoder/convnext.1/pwconv1/Conv_output_0",
"/decoder/convnext.1/act/Constant_output_0"
],
"outputs": [
"/decoder/convnext.1/act/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Erf",
"name": "/decoder/convnext.1/act/Erf",
"inputs": [
"/decoder/convnext.1/act/Div_output_0"
],
"outputs": [
"/decoder/convnext.1/act/Erf_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.1/act/Add",
"inputs": [
"/decoder/convnext.1/act/Erf_output_0",
"/decoder/convnext.1/act/Constant_1_output_0"
],
"outputs": [
"/decoder/convnext.1/act/Add_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.1/act/Mul",
"inputs": [
"/decoder/convnext.1/pwconv1/Conv_output_0",
"/decoder/convnext.1/act/Add_output_0"
],
"outputs": [
"/decoder/convnext.1/act/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.1/act/Mul_1",
"inputs": [
"/decoder/convnext.1/act/Mul_output_0",
"/decoder/convnext.1/act/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.1/act/Mul_1_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.1/pwconv2/Conv",
"inputs": [
"/decoder/convnext.1/act/Mul_1_output_0",
"tts.ae.decoder.convnext.1.pwconv2.weight",
"tts.ae.decoder.convnext.1.pwconv2.bias"
],
"outputs": [
"/decoder/convnext.1/pwconv2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.1/Mul",
"inputs": [
"tts.ae.decoder.convnext.1.gamma",
"/decoder/convnext.1/pwconv2/Conv_output_0"
],
"outputs": [
"/decoder/convnext.1/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.1/Add",
"inputs": [
"/decoder/convnext.0/Add_output_0",
"/decoder/convnext.1/Mul_output_0"
],
"outputs": [
"/decoder/convnext.1/Add_output_0"
],
"attrs": {}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/convnext.2/dwconv/ConstantOfShape",
"inputs": [
"/decoder/convnext.2/dwconv/Constant_output_0"
],
"outputs": [
"/decoder/convnext.2/dwconv/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/convnext.2/dwconv/Concat",
"inputs": [
"/decoder/convnext.2/dwconv/Constant_1_output_0",
"/decoder/convnext.2/dwconv/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/convnext.2/dwconv/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.2/dwconv/Reshape",
"inputs": [
"/decoder/convnext.2/dwconv/Concat_output_0",
"/decoder/convnext.2/dwconv/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.2/dwconv/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/convnext.2/dwconv/Slice",
"inputs": [
"/decoder/convnext.2/dwconv/Reshape_output_0",
"/decoder/convnext.2/dwconv/Constant_4_output_0",
"/decoder/convnext.2/dwconv/Constant_5_output_0",
"/decoder/convnext.2/dwconv/Constant_3_output_0",
"/decoder/convnext.2/dwconv/Constant_6_output_0"
],
"outputs": [
"/decoder/convnext.2/dwconv/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.2/dwconv/Transpose",
"inputs": [
"/decoder/convnext.2/dwconv/Slice_output_0"
],
"outputs": [
"/decoder/convnext.2/dwconv/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.2/dwconv/Reshape_1",
"inputs": [
"/decoder/convnext.2/dwconv/Transpose_output_0",
"/decoder/convnext.2/dwconv/Constant_7_output_0"
],
"outputs": [
"/decoder/convnext.2/dwconv/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/convnext.2/dwconv/Cast",
"inputs": [
"/decoder/convnext.2/dwconv/Reshape_1_output_0"
],
"outputs": [
"/decoder/convnext.2/dwconv/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/convnext.2/dwconv/Pad",
"inputs": [
"/decoder/convnext.1/Add_output_0",
"/decoder/convnext.2/dwconv/Cast_output_0"
],
"outputs": [
"/decoder/convnext.2/dwconv/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.2/dwconv/net/Conv",
"inputs": [
"/decoder/convnext.2/dwconv/Pad_output_0",
"tts.ae.decoder.convnext.2.dwconv.net.weight",
"tts.ae.decoder.convnext.2.dwconv.net.bias"
],
"outputs": [
"/decoder/convnext.2/dwconv/net/Conv_output_0"
],
"attrs": {
"dilations": [
4
],
"group": 512,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.2/norm/Transpose",
"inputs": [
"/decoder/convnext.2/dwconv/net/Conv_output_0"
],
"outputs": [
"/decoder/convnext.2/norm/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "LayerNormalization",
"name": "/decoder/convnext.2/norm/norm/LayerNormalization",
"inputs": [
"/decoder/convnext.2/norm/Transpose_output_0",
"tts.ae.decoder.convnext.2.norm.norm.weight",
"tts.ae.decoder.convnext.2.norm.norm.bias"
],
"outputs": [
"/decoder/convnext.2/norm/norm/LayerNormalization_output_0"
],
"attrs": {
"axis": -1,
"epsilon": 9.999999974752427e-07
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.2/norm/Transpose_1",
"inputs": [
"/decoder/convnext.2/norm/norm/LayerNormalization_output_0"
],
"outputs": [
"/decoder/convnext.2/norm/Transpose_1_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.2/pwconv1/Conv",
"inputs": [
"/decoder/convnext.2/norm/Transpose_1_output_0",
"tts.ae.decoder.convnext.2.pwconv1.weight",
"tts.ae.decoder.convnext.2.pwconv1.bias"
],
"outputs": [
"/decoder/convnext.2/pwconv1/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Div",
"name": "/decoder/convnext.2/act/Div",
"inputs": [
"/decoder/convnext.2/pwconv1/Conv_output_0",
"/decoder/convnext.2/act/Constant_output_0"
],
"outputs": [
"/decoder/convnext.2/act/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Erf",
"name": "/decoder/convnext.2/act/Erf",
"inputs": [
"/decoder/convnext.2/act/Div_output_0"
],
"outputs": [
"/decoder/convnext.2/act/Erf_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.2/act/Add",
"inputs": [
"/decoder/convnext.2/act/Erf_output_0",
"/decoder/convnext.2/act/Constant_1_output_0"
],
"outputs": [
"/decoder/convnext.2/act/Add_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.2/act/Mul",
"inputs": [
"/decoder/convnext.2/pwconv1/Conv_output_0",
"/decoder/convnext.2/act/Add_output_0"
],
"outputs": [
"/decoder/convnext.2/act/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.2/act/Mul_1",
"inputs": [
"/decoder/convnext.2/act/Mul_output_0",
"/decoder/convnext.2/act/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.2/act/Mul_1_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.2/pwconv2/Conv",
"inputs": [
"/decoder/convnext.2/act/Mul_1_output_0",
"tts.ae.decoder.convnext.2.pwconv2.weight",
"tts.ae.decoder.convnext.2.pwconv2.bias"
],
"outputs": [
"/decoder/convnext.2/pwconv2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.2/Mul",
"inputs": [
"tts.ae.decoder.convnext.2.gamma",
"/decoder/convnext.2/pwconv2/Conv_output_0"
],
"outputs": [
"/decoder/convnext.2/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.2/Add",
"inputs": [
"/decoder/convnext.1/Add_output_0",
"/decoder/convnext.2/Mul_output_0"
],
"outputs": [
"/decoder/convnext.2/Add_output_0"
],
"attrs": {}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/convnext.3/dwconv/ConstantOfShape",
"inputs": [
"/decoder/convnext.3/dwconv/Constant_output_0"
],
"outputs": [
"/decoder/convnext.3/dwconv/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/convnext.3/dwconv/Concat",
"inputs": [
"/decoder/convnext.3/dwconv/Constant_1_output_0",
"/decoder/convnext.3/dwconv/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/convnext.3/dwconv/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.3/dwconv/Reshape",
"inputs": [
"/decoder/convnext.3/dwconv/Concat_output_0",
"/decoder/convnext.3/dwconv/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.3/dwconv/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/convnext.3/dwconv/Slice",
"inputs": [
"/decoder/convnext.3/dwconv/Reshape_output_0",
"/decoder/convnext.3/dwconv/Constant_4_output_0",
"/decoder/convnext.3/dwconv/Constant_5_output_0",
"/decoder/convnext.3/dwconv/Constant_3_output_0",
"/decoder/convnext.3/dwconv/Constant_6_output_0"
],
"outputs": [
"/decoder/convnext.3/dwconv/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.3/dwconv/Transpose",
"inputs": [
"/decoder/convnext.3/dwconv/Slice_output_0"
],
"outputs": [
"/decoder/convnext.3/dwconv/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.3/dwconv/Reshape_1",
"inputs": [
"/decoder/convnext.3/dwconv/Transpose_output_0",
"/decoder/convnext.3/dwconv/Constant_7_output_0"
],
"outputs": [
"/decoder/convnext.3/dwconv/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/convnext.3/dwconv/Cast",
"inputs": [
"/decoder/convnext.3/dwconv/Reshape_1_output_0"
],
"outputs": [
"/decoder/convnext.3/dwconv/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/convnext.3/dwconv/Pad",
"inputs": [
"/decoder/convnext.2/Add_output_0",
"/decoder/convnext.3/dwconv/Cast_output_0"
],
"outputs": [
"/decoder/convnext.3/dwconv/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.3/dwconv/net/Conv",
"inputs": [
"/decoder/convnext.3/dwconv/Pad_output_0",
"tts.ae.decoder.convnext.3.dwconv.net.weight",
"tts.ae.decoder.convnext.3.dwconv.net.bias"
],
"outputs": [
"/decoder/convnext.3/dwconv/net/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 512,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.3/norm/Transpose",
"inputs": [
"/decoder/convnext.3/dwconv/net/Conv_output_0"
],
"outputs": [
"/decoder/convnext.3/norm/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "LayerNormalization",
"name": "/decoder/convnext.3/norm/norm/LayerNormalization",
"inputs": [
"/decoder/convnext.3/norm/Transpose_output_0",
"tts.ae.decoder.convnext.3.norm.norm.weight",
"tts.ae.decoder.convnext.3.norm.norm.bias"
],
"outputs": [
"/decoder/convnext.3/norm/norm/LayerNormalization_output_0"
],
"attrs": {
"axis": -1,
"epsilon": 9.999999974752427e-07
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.3/norm/Transpose_1",
"inputs": [
"/decoder/convnext.3/norm/norm/LayerNormalization_output_0"
],
"outputs": [
"/decoder/convnext.3/norm/Transpose_1_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.3/pwconv1/Conv",
"inputs": [
"/decoder/convnext.3/norm/Transpose_1_output_0",
"tts.ae.decoder.convnext.3.pwconv1.weight",
"tts.ae.decoder.convnext.3.pwconv1.bias"
],
"outputs": [
"/decoder/convnext.3/pwconv1/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Div",
"name": "/decoder/convnext.3/act/Div",
"inputs": [
"/decoder/convnext.3/pwconv1/Conv_output_0",
"/decoder/convnext.3/act/Constant_output_0"
],
"outputs": [
"/decoder/convnext.3/act/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Erf",
"name": "/decoder/convnext.3/act/Erf",
"inputs": [
"/decoder/convnext.3/act/Div_output_0"
],
"outputs": [
"/decoder/convnext.3/act/Erf_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.3/act/Add",
"inputs": [
"/decoder/convnext.3/act/Erf_output_0",
"/decoder/convnext.3/act/Constant_1_output_0"
],
"outputs": [
"/decoder/convnext.3/act/Add_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.3/act/Mul",
"inputs": [
"/decoder/convnext.3/pwconv1/Conv_output_0",
"/decoder/convnext.3/act/Add_output_0"
],
"outputs": [
"/decoder/convnext.3/act/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.3/act/Mul_1",
"inputs": [
"/decoder/convnext.3/act/Mul_output_0",
"/decoder/convnext.3/act/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.3/act/Mul_1_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.3/pwconv2/Conv",
"inputs": [
"/decoder/convnext.3/act/Mul_1_output_0",
"tts.ae.decoder.convnext.3.pwconv2.weight",
"tts.ae.decoder.convnext.3.pwconv2.bias"
],
"outputs": [
"/decoder/convnext.3/pwconv2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.3/Mul",
"inputs": [
"tts.ae.decoder.convnext.3.gamma",
"/decoder/convnext.3/pwconv2/Conv_output_0"
],
"outputs": [
"/decoder/convnext.3/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.3/Add",
"inputs": [
"/decoder/convnext.2/Add_output_0",
"/decoder/convnext.3/Mul_output_0"
],
"outputs": [
"/decoder/convnext.3/Add_output_0"
],
"attrs": {}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/convnext.4/dwconv/ConstantOfShape",
"inputs": [
"/decoder/convnext.4/dwconv/Constant_output_0"
],
"outputs": [
"/decoder/convnext.4/dwconv/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/convnext.4/dwconv/Concat",
"inputs": [
"/decoder/convnext.4/dwconv/Constant_1_output_0",
"/decoder/convnext.4/dwconv/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/convnext.4/dwconv/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.4/dwconv/Reshape",
"inputs": [
"/decoder/convnext.4/dwconv/Concat_output_0",
"/decoder/convnext.4/dwconv/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.4/dwconv/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/convnext.4/dwconv/Slice",
"inputs": [
"/decoder/convnext.4/dwconv/Reshape_output_0",
"/decoder/convnext.4/dwconv/Constant_4_output_0",
"/decoder/convnext.4/dwconv/Constant_5_output_0",
"/decoder/convnext.4/dwconv/Constant_3_output_0",
"/decoder/convnext.4/dwconv/Constant_6_output_0"
],
"outputs": [
"/decoder/convnext.4/dwconv/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.4/dwconv/Transpose",
"inputs": [
"/decoder/convnext.4/dwconv/Slice_output_0"
],
"outputs": [
"/decoder/convnext.4/dwconv/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.4/dwconv/Reshape_1",
"inputs": [
"/decoder/convnext.4/dwconv/Transpose_output_0",
"/decoder/convnext.4/dwconv/Constant_7_output_0"
],
"outputs": [
"/decoder/convnext.4/dwconv/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/convnext.4/dwconv/Cast",
"inputs": [
"/decoder/convnext.4/dwconv/Reshape_1_output_0"
],
"outputs": [
"/decoder/convnext.4/dwconv/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/convnext.4/dwconv/Pad",
"inputs": [
"/decoder/convnext.3/Add_output_0",
"/decoder/convnext.4/dwconv/Cast_output_0"
],
"outputs": [
"/decoder/convnext.4/dwconv/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.4/dwconv/net/Conv",
"inputs": [
"/decoder/convnext.4/dwconv/Pad_output_0",
"tts.ae.decoder.convnext.4.dwconv.net.weight",
"tts.ae.decoder.convnext.4.dwconv.net.bias"
],
"outputs": [
"/decoder/convnext.4/dwconv/net/Conv_output_0"
],
"attrs": {
"dilations": [
2
],
"group": 512,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.4/norm/Transpose",
"inputs": [
"/decoder/convnext.4/dwconv/net/Conv_output_0"
],
"outputs": [
"/decoder/convnext.4/norm/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "LayerNormalization",
"name": "/decoder/convnext.4/norm/norm/LayerNormalization",
"inputs": [
"/decoder/convnext.4/norm/Transpose_output_0",
"tts.ae.decoder.convnext.4.norm.norm.weight",
"tts.ae.decoder.convnext.4.norm.norm.bias"
],
"outputs": [
"/decoder/convnext.4/norm/norm/LayerNormalization_output_0"
],
"attrs": {
"axis": -1,
"epsilon": 9.999999974752427e-07
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.4/norm/Transpose_1",
"inputs": [
"/decoder/convnext.4/norm/norm/LayerNormalization_output_0"
],
"outputs": [
"/decoder/convnext.4/norm/Transpose_1_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.4/pwconv1/Conv",
"inputs": [
"/decoder/convnext.4/norm/Transpose_1_output_0",
"tts.ae.decoder.convnext.4.pwconv1.weight",
"tts.ae.decoder.convnext.4.pwconv1.bias"
],
"outputs": [
"/decoder/convnext.4/pwconv1/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Div",
"name": "/decoder/convnext.4/act/Div",
"inputs": [
"/decoder/convnext.4/pwconv1/Conv_output_0",
"/decoder/convnext.4/act/Constant_output_0"
],
"outputs": [
"/decoder/convnext.4/act/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Erf",
"name": "/decoder/convnext.4/act/Erf",
"inputs": [
"/decoder/convnext.4/act/Div_output_0"
],
"outputs": [
"/decoder/convnext.4/act/Erf_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.4/act/Add",
"inputs": [
"/decoder/convnext.4/act/Erf_output_0",
"/decoder/convnext.4/act/Constant_1_output_0"
],
"outputs": [
"/decoder/convnext.4/act/Add_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.4/act/Mul",
"inputs": [
"/decoder/convnext.4/pwconv1/Conv_output_0",
"/decoder/convnext.4/act/Add_output_0"
],
"outputs": [
"/decoder/convnext.4/act/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.4/act/Mul_1",
"inputs": [
"/decoder/convnext.4/act/Mul_output_0",
"/decoder/convnext.4/act/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.4/act/Mul_1_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.4/pwconv2/Conv",
"inputs": [
"/decoder/convnext.4/act/Mul_1_output_0",
"tts.ae.decoder.convnext.4.pwconv2.weight",
"tts.ae.decoder.convnext.4.pwconv2.bias"
],
"outputs": [
"/decoder/convnext.4/pwconv2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.4/Mul",
"inputs": [
"tts.ae.decoder.convnext.4.gamma",
"/decoder/convnext.4/pwconv2/Conv_output_0"
],
"outputs": [
"/decoder/convnext.4/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.4/Add",
"inputs": [
"/decoder/convnext.3/Add_output_0",
"/decoder/convnext.4/Mul_output_0"
],
"outputs": [
"/decoder/convnext.4/Add_output_0"
],
"attrs": {}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/convnext.5/dwconv/ConstantOfShape",
"inputs": [
"/decoder/convnext.5/dwconv/Constant_output_0"
],
"outputs": [
"/decoder/convnext.5/dwconv/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/convnext.5/dwconv/Concat",
"inputs": [
"/decoder/convnext.5/dwconv/Constant_1_output_0",
"/decoder/convnext.5/dwconv/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/convnext.5/dwconv/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.5/dwconv/Reshape",
"inputs": [
"/decoder/convnext.5/dwconv/Concat_output_0",
"/decoder/convnext.5/dwconv/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.5/dwconv/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/convnext.5/dwconv/Slice",
"inputs": [
"/decoder/convnext.5/dwconv/Reshape_output_0",
"/decoder/convnext.5/dwconv/Constant_4_output_0",
"/decoder/convnext.5/dwconv/Constant_5_output_0",
"/decoder/convnext.5/dwconv/Constant_3_output_0",
"/decoder/convnext.5/dwconv/Constant_6_output_0"
],
"outputs": [
"/decoder/convnext.5/dwconv/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.5/dwconv/Transpose",
"inputs": [
"/decoder/convnext.5/dwconv/Slice_output_0"
],
"outputs": [
"/decoder/convnext.5/dwconv/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.5/dwconv/Reshape_1",
"inputs": [
"/decoder/convnext.5/dwconv/Transpose_output_0",
"/decoder/convnext.5/dwconv/Constant_7_output_0"
],
"outputs": [
"/decoder/convnext.5/dwconv/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/convnext.5/dwconv/Cast",
"inputs": [
"/decoder/convnext.5/dwconv/Reshape_1_output_0"
],
"outputs": [
"/decoder/convnext.5/dwconv/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/convnext.5/dwconv/Pad",
"inputs": [
"/decoder/convnext.4/Add_output_0",
"/decoder/convnext.5/dwconv/Cast_output_0"
],
"outputs": [
"/decoder/convnext.5/dwconv/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.5/dwconv/net/Conv",
"inputs": [
"/decoder/convnext.5/dwconv/Pad_output_0",
"tts.ae.decoder.convnext.5.dwconv.net.weight",
"tts.ae.decoder.convnext.5.dwconv.net.bias"
],
"outputs": [
"/decoder/convnext.5/dwconv/net/Conv_output_0"
],
"attrs": {
"dilations": [
4
],
"group": 512,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.5/norm/Transpose",
"inputs": [
"/decoder/convnext.5/dwconv/net/Conv_output_0"
],
"outputs": [
"/decoder/convnext.5/norm/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "LayerNormalization",
"name": "/decoder/convnext.5/norm/norm/LayerNormalization",
"inputs": [
"/decoder/convnext.5/norm/Transpose_output_0",
"tts.ae.decoder.convnext.5.norm.norm.weight",
"tts.ae.decoder.convnext.5.norm.norm.bias"
],
"outputs": [
"/decoder/convnext.5/norm/norm/LayerNormalization_output_0"
],
"attrs": {
"axis": -1,
"epsilon": 9.999999974752427e-07
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.5/norm/Transpose_1",
"inputs": [
"/decoder/convnext.5/norm/norm/LayerNormalization_output_0"
],
"outputs": [
"/decoder/convnext.5/norm/Transpose_1_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.5/pwconv1/Conv",
"inputs": [
"/decoder/convnext.5/norm/Transpose_1_output_0",
"tts.ae.decoder.convnext.5.pwconv1.weight",
"tts.ae.decoder.convnext.5.pwconv1.bias"
],
"outputs": [
"/decoder/convnext.5/pwconv1/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Div",
"name": "/decoder/convnext.5/act/Div",
"inputs": [
"/decoder/convnext.5/pwconv1/Conv_output_0",
"/decoder/convnext.5/act/Constant_output_0"
],
"outputs": [
"/decoder/convnext.5/act/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Erf",
"name": "/decoder/convnext.5/act/Erf",
"inputs": [
"/decoder/convnext.5/act/Div_output_0"
],
"outputs": [
"/decoder/convnext.5/act/Erf_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.5/act/Add",
"inputs": [
"/decoder/convnext.5/act/Erf_output_0",
"/decoder/convnext.5/act/Constant_1_output_0"
],
"outputs": [
"/decoder/convnext.5/act/Add_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.5/act/Mul",
"inputs": [
"/decoder/convnext.5/pwconv1/Conv_output_0",
"/decoder/convnext.5/act/Add_output_0"
],
"outputs": [
"/decoder/convnext.5/act/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.5/act/Mul_1",
"inputs": [
"/decoder/convnext.5/act/Mul_output_0",
"/decoder/convnext.5/act/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.5/act/Mul_1_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.5/pwconv2/Conv",
"inputs": [
"/decoder/convnext.5/act/Mul_1_output_0",
"tts.ae.decoder.convnext.5.pwconv2.weight",
"tts.ae.decoder.convnext.5.pwconv2.bias"
],
"outputs": [
"/decoder/convnext.5/pwconv2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.5/Mul",
"inputs": [
"tts.ae.decoder.convnext.5.gamma",
"/decoder/convnext.5/pwconv2/Conv_output_0"
],
"outputs": [
"/decoder/convnext.5/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.5/Add",
"inputs": [
"/decoder/convnext.4/Add_output_0",
"/decoder/convnext.5/Mul_output_0"
],
"outputs": [
"/decoder/convnext.5/Add_output_0"
],
"attrs": {}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/convnext.6/dwconv/ConstantOfShape",
"inputs": [
"/decoder/convnext.6/dwconv/Constant_output_0"
],
"outputs": [
"/decoder/convnext.6/dwconv/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/convnext.6/dwconv/Concat",
"inputs": [
"/decoder/convnext.6/dwconv/Constant_1_output_0",
"/decoder/convnext.6/dwconv/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/convnext.6/dwconv/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.6/dwconv/Reshape",
"inputs": [
"/decoder/convnext.6/dwconv/Concat_output_0",
"/decoder/convnext.6/dwconv/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.6/dwconv/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/convnext.6/dwconv/Slice",
"inputs": [
"/decoder/convnext.6/dwconv/Reshape_output_0",
"/decoder/convnext.6/dwconv/Constant_4_output_0",
"/decoder/convnext.6/dwconv/Constant_5_output_0",
"/decoder/convnext.6/dwconv/Constant_3_output_0",
"/decoder/convnext.6/dwconv/Constant_6_output_0"
],
"outputs": [
"/decoder/convnext.6/dwconv/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.6/dwconv/Transpose",
"inputs": [
"/decoder/convnext.6/dwconv/Slice_output_0"
],
"outputs": [
"/decoder/convnext.6/dwconv/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.6/dwconv/Reshape_1",
"inputs": [
"/decoder/convnext.6/dwconv/Transpose_output_0",
"/decoder/convnext.6/dwconv/Constant_7_output_0"
],
"outputs": [
"/decoder/convnext.6/dwconv/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/convnext.6/dwconv/Cast",
"inputs": [
"/decoder/convnext.6/dwconv/Reshape_1_output_0"
],
"outputs": [
"/decoder/convnext.6/dwconv/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/convnext.6/dwconv/Pad",
"inputs": [
"/decoder/convnext.5/Add_output_0",
"/decoder/convnext.6/dwconv/Cast_output_0"
],
"outputs": [
"/decoder/convnext.6/dwconv/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.6/dwconv/net/Conv",
"inputs": [
"/decoder/convnext.6/dwconv/Pad_output_0",
"tts.ae.decoder.convnext.6.dwconv.net.weight",
"tts.ae.decoder.convnext.6.dwconv.net.bias"
],
"outputs": [
"/decoder/convnext.6/dwconv/net/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 512,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.6/norm/Transpose",
"inputs": [
"/decoder/convnext.6/dwconv/net/Conv_output_0"
],
"outputs": [
"/decoder/convnext.6/norm/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "LayerNormalization",
"name": "/decoder/convnext.6/norm/norm/LayerNormalization",
"inputs": [
"/decoder/convnext.6/norm/Transpose_output_0",
"tts.ae.decoder.convnext.6.norm.norm.weight",
"tts.ae.decoder.convnext.6.norm.norm.bias"
],
"outputs": [
"/decoder/convnext.6/norm/norm/LayerNormalization_output_0"
],
"attrs": {
"axis": -1,
"epsilon": 9.999999974752427e-07
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.6/norm/Transpose_1",
"inputs": [
"/decoder/convnext.6/norm/norm/LayerNormalization_output_0"
],
"outputs": [
"/decoder/convnext.6/norm/Transpose_1_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.6/pwconv1/Conv",
"inputs": [
"/decoder/convnext.6/norm/Transpose_1_output_0",
"tts.ae.decoder.convnext.6.pwconv1.weight",
"tts.ae.decoder.convnext.6.pwconv1.bias"
],
"outputs": [
"/decoder/convnext.6/pwconv1/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Div",
"name": "/decoder/convnext.6/act/Div",
"inputs": [
"/decoder/convnext.6/pwconv1/Conv_output_0",
"/decoder/convnext.6/act/Constant_output_0"
],
"outputs": [
"/decoder/convnext.6/act/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Erf",
"name": "/decoder/convnext.6/act/Erf",
"inputs": [
"/decoder/convnext.6/act/Div_output_0"
],
"outputs": [
"/decoder/convnext.6/act/Erf_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.6/act/Add",
"inputs": [
"/decoder/convnext.6/act/Erf_output_0",
"/decoder/convnext.6/act/Constant_1_output_0"
],
"outputs": [
"/decoder/convnext.6/act/Add_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.6/act/Mul",
"inputs": [
"/decoder/convnext.6/pwconv1/Conv_output_0",
"/decoder/convnext.6/act/Add_output_0"
],
"outputs": [
"/decoder/convnext.6/act/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.6/act/Mul_1",
"inputs": [
"/decoder/convnext.6/act/Mul_output_0",
"/decoder/convnext.6/act/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.6/act/Mul_1_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.6/pwconv2/Conv",
"inputs": [
"/decoder/convnext.6/act/Mul_1_output_0",
"tts.ae.decoder.convnext.6.pwconv2.weight",
"tts.ae.decoder.convnext.6.pwconv2.bias"
],
"outputs": [
"/decoder/convnext.6/pwconv2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.6/Mul",
"inputs": [
"tts.ae.decoder.convnext.6.gamma",
"/decoder/convnext.6/pwconv2/Conv_output_0"
],
"outputs": [
"/decoder/convnext.6/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.6/Add",
"inputs": [
"/decoder/convnext.5/Add_output_0",
"/decoder/convnext.6/Mul_output_0"
],
"outputs": [
"/decoder/convnext.6/Add_output_0"
],
"attrs": {}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/convnext.7/dwconv/ConstantOfShape",
"inputs": [
"/decoder/convnext.7/dwconv/Constant_output_0"
],
"outputs": [
"/decoder/convnext.7/dwconv/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/convnext.7/dwconv/Concat",
"inputs": [
"/decoder/convnext.7/dwconv/Constant_1_output_0",
"/decoder/convnext.7/dwconv/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/convnext.7/dwconv/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.7/dwconv/Reshape",
"inputs": [
"/decoder/convnext.7/dwconv/Concat_output_0",
"/decoder/convnext.7/dwconv/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.7/dwconv/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/convnext.7/dwconv/Slice",
"inputs": [
"/decoder/convnext.7/dwconv/Reshape_output_0",
"/decoder/convnext.7/dwconv/Constant_4_output_0",
"/decoder/convnext.7/dwconv/Constant_5_output_0",
"/decoder/convnext.7/dwconv/Constant_3_output_0",
"/decoder/convnext.7/dwconv/Constant_6_output_0"
],
"outputs": [
"/decoder/convnext.7/dwconv/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.7/dwconv/Transpose",
"inputs": [
"/decoder/convnext.7/dwconv/Slice_output_0"
],
"outputs": [
"/decoder/convnext.7/dwconv/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.7/dwconv/Reshape_1",
"inputs": [
"/decoder/convnext.7/dwconv/Transpose_output_0",
"/decoder/convnext.7/dwconv/Constant_7_output_0"
],
"outputs": [
"/decoder/convnext.7/dwconv/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/convnext.7/dwconv/Cast",
"inputs": [
"/decoder/convnext.7/dwconv/Reshape_1_output_0"
],
"outputs": [
"/decoder/convnext.7/dwconv/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/convnext.7/dwconv/Pad",
"inputs": [
"/decoder/convnext.6/Add_output_0",
"/decoder/convnext.7/dwconv/Cast_output_0"
],
"outputs": [
"/decoder/convnext.7/dwconv/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.7/dwconv/net/Conv",
"inputs": [
"/decoder/convnext.7/dwconv/Pad_output_0",
"tts.ae.decoder.convnext.7.dwconv.net.weight",
"tts.ae.decoder.convnext.7.dwconv.net.bias"
],
"outputs": [
"/decoder/convnext.7/dwconv/net/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 512,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.7/norm/Transpose",
"inputs": [
"/decoder/convnext.7/dwconv/net/Conv_output_0"
],
"outputs": [
"/decoder/convnext.7/norm/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "LayerNormalization",
"name": "/decoder/convnext.7/norm/norm/LayerNormalization",
"inputs": [
"/decoder/convnext.7/norm/Transpose_output_0",
"tts.ae.decoder.convnext.7.norm.norm.weight",
"tts.ae.decoder.convnext.7.norm.norm.bias"
],
"outputs": [
"/decoder/convnext.7/norm/norm/LayerNormalization_output_0"
],
"attrs": {
"axis": -1,
"epsilon": 9.999999974752427e-07
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.7/norm/Transpose_1",
"inputs": [
"/decoder/convnext.7/norm/norm/LayerNormalization_output_0"
],
"outputs": [
"/decoder/convnext.7/norm/Transpose_1_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.7/pwconv1/Conv",
"inputs": [
"/decoder/convnext.7/norm/Transpose_1_output_0",
"tts.ae.decoder.convnext.7.pwconv1.weight",
"tts.ae.decoder.convnext.7.pwconv1.bias"
],
"outputs": [
"/decoder/convnext.7/pwconv1/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Div",
"name": "/decoder/convnext.7/act/Div",
"inputs": [
"/decoder/convnext.7/pwconv1/Conv_output_0",
"/decoder/convnext.7/act/Constant_output_0"
],
"outputs": [
"/decoder/convnext.7/act/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Erf",
"name": "/decoder/convnext.7/act/Erf",
"inputs": [
"/decoder/convnext.7/act/Div_output_0"
],
"outputs": [
"/decoder/convnext.7/act/Erf_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.7/act/Add",
"inputs": [
"/decoder/convnext.7/act/Erf_output_0",
"/decoder/convnext.7/act/Constant_1_output_0"
],
"outputs": [
"/decoder/convnext.7/act/Add_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.7/act/Mul",
"inputs": [
"/decoder/convnext.7/pwconv1/Conv_output_0",
"/decoder/convnext.7/act/Add_output_0"
],
"outputs": [
"/decoder/convnext.7/act/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.7/act/Mul_1",
"inputs": [
"/decoder/convnext.7/act/Mul_output_0",
"/decoder/convnext.7/act/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.7/act/Mul_1_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.7/pwconv2/Conv",
"inputs": [
"/decoder/convnext.7/act/Mul_1_output_0",
"tts.ae.decoder.convnext.7.pwconv2.weight",
"tts.ae.decoder.convnext.7.pwconv2.bias"
],
"outputs": [
"/decoder/convnext.7/pwconv2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.7/Mul",
"inputs": [
"tts.ae.decoder.convnext.7.gamma",
"/decoder/convnext.7/pwconv2/Conv_output_0"
],
"outputs": [
"/decoder/convnext.7/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.7/Add",
"inputs": [
"/decoder/convnext.6/Add_output_0",
"/decoder/convnext.7/Mul_output_0"
],
"outputs": [
"/decoder/convnext.7/Add_output_0"
],
"attrs": {}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/convnext.8/dwconv/ConstantOfShape",
"inputs": [
"/decoder/convnext.8/dwconv/Constant_output_0"
],
"outputs": [
"/decoder/convnext.8/dwconv/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/convnext.8/dwconv/Concat",
"inputs": [
"/decoder/convnext.8/dwconv/Constant_1_output_0",
"/decoder/convnext.8/dwconv/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/convnext.8/dwconv/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.8/dwconv/Reshape",
"inputs": [
"/decoder/convnext.8/dwconv/Concat_output_0",
"/decoder/convnext.8/dwconv/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.8/dwconv/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/convnext.8/dwconv/Slice",
"inputs": [
"/decoder/convnext.8/dwconv/Reshape_output_0",
"/decoder/convnext.8/dwconv/Constant_4_output_0",
"/decoder/convnext.8/dwconv/Constant_5_output_0",
"/decoder/convnext.8/dwconv/Constant_3_output_0",
"/decoder/convnext.8/dwconv/Constant_6_output_0"
],
"outputs": [
"/decoder/convnext.8/dwconv/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.8/dwconv/Transpose",
"inputs": [
"/decoder/convnext.8/dwconv/Slice_output_0"
],
"outputs": [
"/decoder/convnext.8/dwconv/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.8/dwconv/Reshape_1",
"inputs": [
"/decoder/convnext.8/dwconv/Transpose_output_0",
"/decoder/convnext.8/dwconv/Constant_7_output_0"
],
"outputs": [
"/decoder/convnext.8/dwconv/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/convnext.8/dwconv/Cast",
"inputs": [
"/decoder/convnext.8/dwconv/Reshape_1_output_0"
],
"outputs": [
"/decoder/convnext.8/dwconv/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/convnext.8/dwconv/Pad",
"inputs": [
"/decoder/convnext.7/Add_output_0",
"/decoder/convnext.8/dwconv/Cast_output_0"
],
"outputs": [
"/decoder/convnext.8/dwconv/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.8/dwconv/net/Conv",
"inputs": [
"/decoder/convnext.8/dwconv/Pad_output_0",
"tts.ae.decoder.convnext.8.dwconv.net.weight",
"tts.ae.decoder.convnext.8.dwconv.net.bias"
],
"outputs": [
"/decoder/convnext.8/dwconv/net/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 512,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.8/norm/Transpose",
"inputs": [
"/decoder/convnext.8/dwconv/net/Conv_output_0"
],
"outputs": [
"/decoder/convnext.8/norm/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "LayerNormalization",
"name": "/decoder/convnext.8/norm/norm/LayerNormalization",
"inputs": [
"/decoder/convnext.8/norm/Transpose_output_0",
"tts.ae.decoder.convnext.8.norm.norm.weight",
"tts.ae.decoder.convnext.8.norm.norm.bias"
],
"outputs": [
"/decoder/convnext.8/norm/norm/LayerNormalization_output_0"
],
"attrs": {
"axis": -1,
"epsilon": 9.999999974752427e-07
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.8/norm/Transpose_1",
"inputs": [
"/decoder/convnext.8/norm/norm/LayerNormalization_output_0"
],
"outputs": [
"/decoder/convnext.8/norm/Transpose_1_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.8/pwconv1/Conv",
"inputs": [
"/decoder/convnext.8/norm/Transpose_1_output_0",
"tts.ae.decoder.convnext.8.pwconv1.weight",
"tts.ae.decoder.convnext.8.pwconv1.bias"
],
"outputs": [
"/decoder/convnext.8/pwconv1/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Div",
"name": "/decoder/convnext.8/act/Div",
"inputs": [
"/decoder/convnext.8/pwconv1/Conv_output_0",
"/decoder/convnext.8/act/Constant_output_0"
],
"outputs": [
"/decoder/convnext.8/act/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Erf",
"name": "/decoder/convnext.8/act/Erf",
"inputs": [
"/decoder/convnext.8/act/Div_output_0"
],
"outputs": [
"/decoder/convnext.8/act/Erf_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.8/act/Add",
"inputs": [
"/decoder/convnext.8/act/Erf_output_0",
"/decoder/convnext.8/act/Constant_1_output_0"
],
"outputs": [
"/decoder/convnext.8/act/Add_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.8/act/Mul",
"inputs": [
"/decoder/convnext.8/pwconv1/Conv_output_0",
"/decoder/convnext.8/act/Add_output_0"
],
"outputs": [
"/decoder/convnext.8/act/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.8/act/Mul_1",
"inputs": [
"/decoder/convnext.8/act/Mul_output_0",
"/decoder/convnext.8/act/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.8/act/Mul_1_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.8/pwconv2/Conv",
"inputs": [
"/decoder/convnext.8/act/Mul_1_output_0",
"tts.ae.decoder.convnext.8.pwconv2.weight",
"tts.ae.decoder.convnext.8.pwconv2.bias"
],
"outputs": [
"/decoder/convnext.8/pwconv2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.8/Mul",
"inputs": [
"tts.ae.decoder.convnext.8.gamma",
"/decoder/convnext.8/pwconv2/Conv_output_0"
],
"outputs": [
"/decoder/convnext.8/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.8/Add",
"inputs": [
"/decoder/convnext.7/Add_output_0",
"/decoder/convnext.8/Mul_output_0"
],
"outputs": [
"/decoder/convnext.8/Add_output_0"
],
"attrs": {}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/convnext.9/dwconv/ConstantOfShape",
"inputs": [
"/decoder/convnext.9/dwconv/Constant_output_0"
],
"outputs": [
"/decoder/convnext.9/dwconv/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/convnext.9/dwconv/Concat",
"inputs": [
"/decoder/convnext.9/dwconv/Constant_1_output_0",
"/decoder/convnext.9/dwconv/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/convnext.9/dwconv/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.9/dwconv/Reshape",
"inputs": [
"/decoder/convnext.9/dwconv/Concat_output_0",
"/decoder/convnext.9/dwconv/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.9/dwconv/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/convnext.9/dwconv/Slice",
"inputs": [
"/decoder/convnext.9/dwconv/Reshape_output_0",
"/decoder/convnext.9/dwconv/Constant_4_output_0",
"/decoder/convnext.9/dwconv/Constant_5_output_0",
"/decoder/convnext.9/dwconv/Constant_3_output_0",
"/decoder/convnext.9/dwconv/Constant_6_output_0"
],
"outputs": [
"/decoder/convnext.9/dwconv/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.9/dwconv/Transpose",
"inputs": [
"/decoder/convnext.9/dwconv/Slice_output_0"
],
"outputs": [
"/decoder/convnext.9/dwconv/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/convnext.9/dwconv/Reshape_1",
"inputs": [
"/decoder/convnext.9/dwconv/Transpose_output_0",
"/decoder/convnext.9/dwconv/Constant_7_output_0"
],
"outputs": [
"/decoder/convnext.9/dwconv/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/convnext.9/dwconv/Cast",
"inputs": [
"/decoder/convnext.9/dwconv/Reshape_1_output_0"
],
"outputs": [
"/decoder/convnext.9/dwconv/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/convnext.9/dwconv/Pad",
"inputs": [
"/decoder/convnext.8/Add_output_0",
"/decoder/convnext.9/dwconv/Cast_output_0"
],
"outputs": [
"/decoder/convnext.9/dwconv/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.9/dwconv/net/Conv",
"inputs": [
"/decoder/convnext.9/dwconv/Pad_output_0",
"tts.ae.decoder.convnext.9.dwconv.net.weight",
"tts.ae.decoder.convnext.9.dwconv.net.bias"
],
"outputs": [
"/decoder/convnext.9/dwconv/net/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 512,
"kernel_shape": [
7
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.9/norm/Transpose",
"inputs": [
"/decoder/convnext.9/dwconv/net/Conv_output_0"
],
"outputs": [
"/decoder/convnext.9/norm/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "LayerNormalization",
"name": "/decoder/convnext.9/norm/norm/LayerNormalization",
"inputs": [
"/decoder/convnext.9/norm/Transpose_output_0",
"tts.ae.decoder.convnext.9.norm.norm.weight",
"tts.ae.decoder.convnext.9.norm.norm.bias"
],
"outputs": [
"/decoder/convnext.9/norm/norm/LayerNormalization_output_0"
],
"attrs": {
"axis": -1,
"epsilon": 9.999999974752427e-07
}
},
{
"op_type": "Transpose",
"name": "/decoder/convnext.9/norm/Transpose_1",
"inputs": [
"/decoder/convnext.9/norm/norm/LayerNormalization_output_0"
],
"outputs": [
"/decoder/convnext.9/norm/Transpose_1_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.9/pwconv1/Conv",
"inputs": [
"/decoder/convnext.9/norm/Transpose_1_output_0",
"tts.ae.decoder.convnext.9.pwconv1.weight",
"tts.ae.decoder.convnext.9.pwconv1.bias"
],
"outputs": [
"/decoder/convnext.9/pwconv1/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Div",
"name": "/decoder/convnext.9/act/Div",
"inputs": [
"/decoder/convnext.9/pwconv1/Conv_output_0",
"/decoder/convnext.9/act/Constant_output_0"
],
"outputs": [
"/decoder/convnext.9/act/Div_output_0"
],
"attrs": {}
},
{
"op_type": "Erf",
"name": "/decoder/convnext.9/act/Erf",
"inputs": [
"/decoder/convnext.9/act/Div_output_0"
],
"outputs": [
"/decoder/convnext.9/act/Erf_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.9/act/Add",
"inputs": [
"/decoder/convnext.9/act/Erf_output_0",
"/decoder/convnext.9/act/Constant_1_output_0"
],
"outputs": [
"/decoder/convnext.9/act/Add_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.9/act/Mul",
"inputs": [
"/decoder/convnext.9/pwconv1/Conv_output_0",
"/decoder/convnext.9/act/Add_output_0"
],
"outputs": [
"/decoder/convnext.9/act/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.9/act/Mul_1",
"inputs": [
"/decoder/convnext.9/act/Mul_output_0",
"/decoder/convnext.9/act/Constant_2_output_0"
],
"outputs": [
"/decoder/convnext.9/act/Mul_1_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/convnext.9/pwconv2/Conv",
"inputs": [
"/decoder/convnext.9/act/Mul_1_output_0",
"tts.ae.decoder.convnext.9.pwconv2.weight",
"tts.ae.decoder.convnext.9.pwconv2.bias"
],
"outputs": [
"/decoder/convnext.9/pwconv2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Mul",
"name": "/decoder/convnext.9/Mul",
"inputs": [
"tts.ae.decoder.convnext.9.gamma",
"/decoder/convnext.9/pwconv2/Conv_output_0"
],
"outputs": [
"/decoder/convnext.9/Mul_output_0"
],
"attrs": {}
},
{
"op_type": "Add",
"name": "/decoder/convnext.9/Add",
"inputs": [
"/decoder/convnext.8/Add_output_0",
"/decoder/convnext.9/Mul_output_0"
],
"outputs": [
"/decoder/convnext.9/Add_output_0"
],
"attrs": {}
},
{
"op_type": "BatchNormalization",
"name": "/decoder/final_norm/BatchNormalization",
"inputs": [
"/decoder/convnext.9/Add_output_0",
"tts.ae.decoder.final_norm.norm.weight",
"tts.ae.decoder.final_norm.norm.bias",
"tts.ae.decoder.final_norm.norm.running_mean",
"tts.ae.decoder.final_norm.norm.running_var"
],
"outputs": [
"/decoder/final_norm/BatchNormalization_output_0"
],
"attrs": {
"epsilon": 9.999999747378752e-06,
"momentum": 0.8999999761581421,
"training_mode": 0
}
},
{
"op_type": "ConstantOfShape",
"name": "/decoder/head/layer1/ConstantOfShape",
"inputs": [
"/decoder/head/layer1/Constant_output_0"
],
"outputs": [
"/decoder/head/layer1/ConstantOfShape_output_0"
],
"attrs": {
"value": {
"dtype": "int64",
"shape": [
1
],
"data": [
0
]
}
}
},
{
"op_type": "Concat",
"name": "/decoder/head/layer1/Concat",
"inputs": [
"/decoder/head/layer1/Constant_1_output_0",
"/decoder/head/layer1/ConstantOfShape_output_0"
],
"outputs": [
"/decoder/head/layer1/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/head/layer1/Reshape",
"inputs": [
"/decoder/head/layer1/Concat_output_0",
"/decoder/head/layer1/Constant_2_output_0"
],
"outputs": [
"/decoder/head/layer1/Reshape_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Slice",
"name": "/decoder/head/layer1/Slice",
"inputs": [
"/decoder/head/layer1/Reshape_output_0",
"/decoder/head/layer1/Constant_4_output_0",
"/decoder/head/layer1/Constant_5_output_0",
"/decoder/head/layer1/Constant_3_output_0",
"/decoder/head/layer1/Constant_6_output_0"
],
"outputs": [
"/decoder/head/layer1/Slice_output_0"
],
"attrs": {}
},
{
"op_type": "Transpose",
"name": "/decoder/head/layer1/Transpose",
"inputs": [
"/decoder/head/layer1/Slice_output_0"
],
"outputs": [
"/decoder/head/layer1/Transpose_output_0"
],
"attrs": {
"perm": [
1,
0
]
}
},
{
"op_type": "Reshape",
"name": "/decoder/head/layer1/Reshape_1",
"inputs": [
"/decoder/head/layer1/Transpose_output_0",
"/decoder/head/layer1/Constant_7_output_0"
],
"outputs": [
"/decoder/head/layer1/Reshape_1_output_0"
],
"attrs": {
"allowzero": 0
}
},
{
"op_type": "Cast",
"name": "/decoder/head/layer1/Cast",
"inputs": [
"/decoder/head/layer1/Reshape_1_output_0"
],
"outputs": [
"/decoder/head/layer1/Cast_output_0"
],
"attrs": {
"to": 7
}
},
{
"op_type": "Pad",
"name": "/decoder/head/layer1/Pad",
"inputs": [
"/decoder/final_norm/BatchNormalization_output_0",
"/decoder/head/layer1/Cast_output_0"
],
"outputs": [
"/decoder/head/layer1/Pad_output_0"
],
"attrs": {
"mode": "edge"
}
},
{
"op_type": "Conv",
"name": "/decoder/head/layer1/net/Conv",
"inputs": [
"/decoder/head/layer1/Pad_output_0",
"tts.ae.decoder.head.layer1.net.weight",
"tts.ae.decoder.head.layer1.net.bias"
],
"outputs": [
"/decoder/head/layer1/net/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
3
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "PRelu",
"name": "/decoder/head/act/PRelu",
"inputs": [
"/decoder/head/layer1/net/Conv_output_0",
"onnx::PRelu_1506"
],
"outputs": [
"/decoder/head/act/PRelu_output_0"
],
"attrs": {}
},
{
"op_type": "Conv",
"name": "/decoder/head/layer2/Conv",
"inputs": [
"/decoder/head/act/PRelu_output_0",
"tts.ae.decoder.head.layer2.weight"
],
"outputs": [
"/decoder/head/layer2/Conv_output_0"
],
"attrs": {
"dilations": [
1
],
"group": 1,
"kernel_shape": [
1
],
"pads": [
0,
0
],
"strides": [
1
]
}
},
{
"op_type": "Transpose",
"name": "/decoder/head/Transpose",
"inputs": [
"/decoder/head/layer2/Conv_output_0"
],
"outputs": [
"/decoder/head/Transpose_output_0"
],
"attrs": {
"perm": [
0,
2,
1
]
}
},
{
"op_type": "Shape",
"name": "/decoder/head/Shape",
"inputs": [
"/decoder/head/Transpose_output_0"
],
"outputs": [
"/decoder/head/Shape_output_0"
],
"attrs": {}
},
{
"op_type": "Gather",
"name": "/decoder/head/Gather",
"inputs": [
"/decoder/head/Shape_output_0",
"/decoder/head/Constant_output_0"
],
"outputs": [
"/decoder/head/Gather_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Unsqueeze",
"name": "/decoder/head/Unsqueeze",
"inputs": [
"/decoder/head/Gather_output_0",
"onnx::Unsqueeze_1434"
],
"outputs": [
"/decoder/head/Unsqueeze_output_0"
],
"attrs": {}
},
{
"op_type": "Concat",
"name": "/decoder/head/Concat",
"inputs": [
"/decoder/head/Unsqueeze_output_0",
"/decoder/head/Constant_1_output_0"
],
"outputs": [
"/decoder/head/Concat_output_0"
],
"attrs": {
"axis": 0
}
},
{
"op_type": "Reshape",
"name": "/decoder/head/Reshape",
"inputs": [
"/decoder/head/Transpose_output_0",
"/decoder/head/Concat_output_0"
],
"outputs": [
"wav_tts"
],
"attrs": {
"allowzero": 0
}
}
]
}