Instructions to use mlx-community/supertonic-3 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- MLX
How to use mlx-community/supertonic-3 with MLX:
# Download the model from the Hub pip install huggingface_hub[hf_xet] huggingface-cli download --local-dir supertonic-3 mlx-community/supertonic-3
- Notebooks
- Google Colab
- Kaggle
- Local Apps
- LM Studio
| { | |
| "ir_version": 9, | |
| "opsets": [ | |
| { | |
| "domain": "", | |
| "version": 19 | |
| } | |
| ], | |
| "inputs": [ | |
| "latent" | |
| ], | |
| "outputs": [ | |
| "wav_tts" | |
| ], | |
| "weight_map": { | |
| "tts.ttl.normalizer.scale": "w000000", | |
| "tts.ae.latent_mean": "w000001", | |
| "tts.ae.latent_std": "w000002", | |
| "tts.ae.decoder.convnext.0.gamma": "w000003", | |
| "tts.ae.decoder.convnext.0.dwconv.net.weight": "w000004", | |
| "tts.ae.decoder.convnext.0.dwconv.net.bias": "w000005", | |
| "tts.ae.decoder.convnext.0.norm.norm.weight": "w000006", | |
| "tts.ae.decoder.convnext.0.norm.norm.bias": "w000007", | |
| "tts.ae.decoder.convnext.0.pwconv1.weight": "w000008", | |
| "tts.ae.decoder.convnext.0.pwconv1.bias": "w000009", | |
| "tts.ae.decoder.convnext.0.pwconv2.weight": "w000010", | |
| "tts.ae.decoder.convnext.0.pwconv2.bias": "w000011", | |
| "tts.ae.decoder.convnext.1.gamma": "w000012", | |
| "tts.ae.decoder.convnext.1.dwconv.net.weight": "w000013", | |
| "tts.ae.decoder.convnext.1.dwconv.net.bias": "w000014", | |
| "tts.ae.decoder.convnext.1.norm.norm.weight": "w000015", | |
| "tts.ae.decoder.convnext.1.norm.norm.bias": "w000016", | |
| "tts.ae.decoder.convnext.1.pwconv1.weight": "w000017", | |
| "tts.ae.decoder.convnext.1.pwconv1.bias": "w000018", | |
| "tts.ae.decoder.convnext.1.pwconv2.weight": "w000019", | |
| "tts.ae.decoder.convnext.1.pwconv2.bias": "w000020", | |
| "tts.ae.decoder.convnext.2.gamma": "w000021", | |
| "tts.ae.decoder.convnext.2.dwconv.net.weight": "w000022", | |
| "tts.ae.decoder.convnext.2.dwconv.net.bias": "w000023", | |
| "tts.ae.decoder.convnext.2.norm.norm.weight": "w000024", | |
| "tts.ae.decoder.convnext.2.norm.norm.bias": "w000025", | |
| "tts.ae.decoder.convnext.2.pwconv1.weight": "w000026", | |
| "tts.ae.decoder.convnext.2.pwconv1.bias": "w000027", | |
| "tts.ae.decoder.convnext.2.pwconv2.weight": "w000028", | |
| "tts.ae.decoder.convnext.2.pwconv2.bias": "w000029", | |
| "tts.ae.decoder.convnext.3.gamma": "w000030", | |
| "tts.ae.decoder.convnext.3.dwconv.net.weight": "w000031", | |
| "tts.ae.decoder.convnext.3.dwconv.net.bias": "w000032", | |
| "tts.ae.decoder.convnext.3.norm.norm.weight": "w000033", | |
| "tts.ae.decoder.convnext.3.norm.norm.bias": "w000034", | |
| "tts.ae.decoder.convnext.3.pwconv1.weight": "w000035", | |
| "tts.ae.decoder.convnext.3.pwconv1.bias": "w000036", | |
| "tts.ae.decoder.convnext.3.pwconv2.weight": "w000037", | |
| "tts.ae.decoder.convnext.3.pwconv2.bias": "w000038", | |
| "tts.ae.decoder.convnext.4.gamma": "w000039", | |
| "tts.ae.decoder.convnext.4.dwconv.net.weight": "w000040", | |
| "tts.ae.decoder.convnext.4.dwconv.net.bias": "w000041", | |
| "tts.ae.decoder.convnext.4.norm.norm.weight": "w000042", | |
| "tts.ae.decoder.convnext.4.norm.norm.bias": "w000043", | |
| "tts.ae.decoder.convnext.4.pwconv1.weight": "w000044", | |
| "tts.ae.decoder.convnext.4.pwconv1.bias": "w000045", | |
| "tts.ae.decoder.convnext.4.pwconv2.weight": "w000046", | |
| "tts.ae.decoder.convnext.4.pwconv2.bias": "w000047", | |
| "tts.ae.decoder.convnext.5.gamma": "w000048", | |
| "tts.ae.decoder.convnext.5.dwconv.net.weight": "w000049", | |
| "tts.ae.decoder.convnext.5.dwconv.net.bias": "w000050", | |
| "tts.ae.decoder.convnext.5.norm.norm.weight": "w000051", | |
| "tts.ae.decoder.convnext.5.norm.norm.bias": "w000052", | |
| "tts.ae.decoder.convnext.5.pwconv1.weight": "w000053", | |
| "tts.ae.decoder.convnext.5.pwconv1.bias": "w000054", | |
| "tts.ae.decoder.convnext.5.pwconv2.weight": "w000055", | |
| "tts.ae.decoder.convnext.5.pwconv2.bias": "w000056", | |
| "tts.ae.decoder.convnext.6.gamma": "w000057", | |
| "tts.ae.decoder.convnext.6.dwconv.net.weight": "w000058", | |
| "tts.ae.decoder.convnext.6.dwconv.net.bias": "w000059", | |
| "tts.ae.decoder.convnext.6.norm.norm.weight": "w000060", | |
| "tts.ae.decoder.convnext.6.norm.norm.bias": "w000061", | |
| "tts.ae.decoder.convnext.6.pwconv1.weight": "w000062", | |
| "tts.ae.decoder.convnext.6.pwconv1.bias": "w000063", | |
| "tts.ae.decoder.convnext.6.pwconv2.weight": "w000064", | |
| "tts.ae.decoder.convnext.6.pwconv2.bias": "w000065", | |
| "tts.ae.decoder.convnext.7.gamma": "w000066", | |
| "tts.ae.decoder.convnext.7.dwconv.net.weight": "w000067", | |
| "tts.ae.decoder.convnext.7.dwconv.net.bias": "w000068", | |
| "tts.ae.decoder.convnext.7.norm.norm.weight": "w000069", | |
| "tts.ae.decoder.convnext.7.norm.norm.bias": "w000070", | |
| "tts.ae.decoder.convnext.7.pwconv1.weight": "w000071", | |
| "tts.ae.decoder.convnext.7.pwconv1.bias": "w000072", | |
| "tts.ae.decoder.convnext.7.pwconv2.weight": "w000073", | |
| "tts.ae.decoder.convnext.7.pwconv2.bias": "w000074", | |
| "tts.ae.decoder.convnext.8.gamma": "w000075", | |
| "tts.ae.decoder.convnext.8.dwconv.net.weight": "w000076", | |
| "tts.ae.decoder.convnext.8.dwconv.net.bias": "w000077", | |
| "tts.ae.decoder.convnext.8.norm.norm.weight": "w000078", | |
| "tts.ae.decoder.convnext.8.norm.norm.bias": "w000079", | |
| "tts.ae.decoder.convnext.8.pwconv1.weight": "w000080", | |
| "tts.ae.decoder.convnext.8.pwconv1.bias": "w000081", | |
| "tts.ae.decoder.convnext.8.pwconv2.weight": "w000082", | |
| "tts.ae.decoder.convnext.8.pwconv2.bias": "w000083", | |
| "tts.ae.decoder.convnext.9.gamma": "w000084", | |
| "tts.ae.decoder.convnext.9.dwconv.net.weight": "w000085", | |
| "tts.ae.decoder.convnext.9.dwconv.net.bias": "w000086", | |
| "tts.ae.decoder.convnext.9.norm.norm.weight": "w000087", | |
| "tts.ae.decoder.convnext.9.norm.norm.bias": "w000088", | |
| "tts.ae.decoder.convnext.9.pwconv1.weight": "w000089", | |
| "tts.ae.decoder.convnext.9.pwconv1.bias": "w000090", | |
| "tts.ae.decoder.convnext.9.pwconv2.weight": "w000091", | |
| "tts.ae.decoder.convnext.9.pwconv2.bias": "w000092", | |
| "tts.ae.decoder.final_norm.norm.weight": "w000093", | |
| "tts.ae.decoder.final_norm.norm.bias": "w000094", | |
| "tts.ae.decoder.final_norm.norm.running_mean": "w000095", | |
| "tts.ae.decoder.final_norm.norm.running_var": "w000096", | |
| "tts.ae.decoder.head.layer1.net.weight": "w000097", | |
| "tts.ae.decoder.head.layer1.net.bias": "w000098", | |
| "tts.ae.decoder.head.layer2.weight": "w000099", | |
| "onnx::Conv_1441": "w000100", | |
| "onnx::Conv_1442": "w000101", | |
| "onnx::PRelu_1506": "w000102", | |
| "/Constant_output_0": "c000000", | |
| "/Constant_1_output_0": "c000001", | |
| "/Constant_2_output_0": "c000002", | |
| "/Constant_3_output_0": "c000003", | |
| "/Constant_4_output_0": "c000004", | |
| "onnx::Unsqueeze_967": "c000005", | |
| "/Constant_5_output_0": "c000006", | |
| "/Constant_6_output_0": "c000007", | |
| "onnx::Unsqueeze_973": "c000008", | |
| "/Constant_7_output_0": "c000009", | |
| "/Constant_8_output_0": "c000010", | |
| "onnx::Unsqueeze_984": "c000011", | |
| "onnx::Unsqueeze_986": "c000012", | |
| "/Constant_9_output_0": "c000013", | |
| "/decoder/embed/Constant_output_0": "c000014", | |
| "/decoder/embed/Constant_1_output_0": "c000015", | |
| "/decoder/embed/Constant_2_output_0": "c000016", | |
| "/decoder/embed/Constant_3_output_0": "c000017", | |
| "/decoder/embed/Constant_4_output_0": "c000018", | |
| "/decoder/embed/Constant_5_output_0": "c000019", | |
| "/decoder/embed/Constant_6_output_0": "c000020", | |
| "/decoder/embed/Constant_7_output_0": "c000021", | |
| "/decoder/convnext.0/dwconv/Constant_output_0": "c000022", | |
| "/decoder/convnext.0/dwconv/Constant_1_output_0": "c000023", | |
| "/decoder/convnext.0/dwconv/Constant_2_output_0": "c000024", | |
| "/decoder/convnext.0/dwconv/Constant_3_output_0": "c000025", | |
| "/decoder/convnext.0/dwconv/Constant_4_output_0": "c000026", | |
| "/decoder/convnext.0/dwconv/Constant_5_output_0": "c000027", | |
| "/decoder/convnext.0/dwconv/Constant_6_output_0": "c000028", | |
| "/decoder/convnext.0/dwconv/Constant_7_output_0": "c000029", | |
| "/decoder/convnext.0/act/Constant_output_0": "c000030", | |
| "/decoder/convnext.0/act/Constant_1_output_0": "c000031", | |
| "/decoder/convnext.0/act/Constant_2_output_0": "c000032", | |
| "/decoder/convnext.1/dwconv/Constant_output_0": "c000033", | |
| "/decoder/convnext.1/dwconv/Constant_1_output_0": "c000034", | |
| "/decoder/convnext.1/dwconv/Constant_2_output_0": "c000035", | |
| "/decoder/convnext.1/dwconv/Constant_3_output_0": "c000036", | |
| "/decoder/convnext.1/dwconv/Constant_4_output_0": "c000037", | |
| "/decoder/convnext.1/dwconv/Constant_5_output_0": "c000038", | |
| "/decoder/convnext.1/dwconv/Constant_6_output_0": "c000039", | |
| "/decoder/convnext.1/dwconv/Constant_7_output_0": "c000040", | |
| "/decoder/convnext.1/act/Constant_output_0": "c000041", | |
| "/decoder/convnext.1/act/Constant_1_output_0": "c000042", | |
| "/decoder/convnext.1/act/Constant_2_output_0": "c000043", | |
| "/decoder/convnext.2/dwconv/Constant_output_0": "c000044", | |
| "/decoder/convnext.2/dwconv/Constant_1_output_0": "c000045", | |
| "/decoder/convnext.2/dwconv/Constant_2_output_0": "c000046", | |
| "/decoder/convnext.2/dwconv/Constant_3_output_0": "c000047", | |
| "/decoder/convnext.2/dwconv/Constant_4_output_0": "c000048", | |
| "/decoder/convnext.2/dwconv/Constant_5_output_0": "c000049", | |
| "/decoder/convnext.2/dwconv/Constant_6_output_0": "c000050", | |
| "/decoder/convnext.2/dwconv/Constant_7_output_0": "c000051", | |
| "/decoder/convnext.2/act/Constant_output_0": "c000052", | |
| "/decoder/convnext.2/act/Constant_1_output_0": "c000053", | |
| "/decoder/convnext.2/act/Constant_2_output_0": "c000054", | |
| "/decoder/convnext.3/dwconv/Constant_output_0": "c000055", | |
| "/decoder/convnext.3/dwconv/Constant_1_output_0": "c000056", | |
| "/decoder/convnext.3/dwconv/Constant_2_output_0": "c000057", | |
| "/decoder/convnext.3/dwconv/Constant_3_output_0": "c000058", | |
| "/decoder/convnext.3/dwconv/Constant_4_output_0": "c000059", | |
| "/decoder/convnext.3/dwconv/Constant_5_output_0": "c000060", | |
| "/decoder/convnext.3/dwconv/Constant_6_output_0": "c000061", | |
| "/decoder/convnext.3/dwconv/Constant_7_output_0": "c000062", | |
| "/decoder/convnext.3/act/Constant_output_0": "c000063", | |
| "/decoder/convnext.3/act/Constant_1_output_0": "c000064", | |
| "/decoder/convnext.3/act/Constant_2_output_0": "c000065", | |
| "/decoder/convnext.4/dwconv/Constant_output_0": "c000066", | |
| "/decoder/convnext.4/dwconv/Constant_1_output_0": "c000067", | |
| "/decoder/convnext.4/dwconv/Constant_2_output_0": "c000068", | |
| "/decoder/convnext.4/dwconv/Constant_3_output_0": "c000069", | |
| "/decoder/convnext.4/dwconv/Constant_4_output_0": "c000070", | |
| "/decoder/convnext.4/dwconv/Constant_5_output_0": "c000071", | |
| "/decoder/convnext.4/dwconv/Constant_6_output_0": "c000072", | |
| "/decoder/convnext.4/dwconv/Constant_7_output_0": "c000073", | |
| "/decoder/convnext.4/act/Constant_output_0": "c000074", | |
| "/decoder/convnext.4/act/Constant_1_output_0": "c000075", | |
| "/decoder/convnext.4/act/Constant_2_output_0": "c000076", | |
| "/decoder/convnext.5/dwconv/Constant_output_0": "c000077", | |
| "/decoder/convnext.5/dwconv/Constant_1_output_0": "c000078", | |
| "/decoder/convnext.5/dwconv/Constant_2_output_0": "c000079", | |
| "/decoder/convnext.5/dwconv/Constant_3_output_0": "c000080", | |
| "/decoder/convnext.5/dwconv/Constant_4_output_0": "c000081", | |
| "/decoder/convnext.5/dwconv/Constant_5_output_0": "c000082", | |
| "/decoder/convnext.5/dwconv/Constant_6_output_0": "c000083", | |
| "/decoder/convnext.5/dwconv/Constant_7_output_0": "c000084", | |
| "/decoder/convnext.5/act/Constant_output_0": "c000085", | |
| "/decoder/convnext.5/act/Constant_1_output_0": "c000086", | |
| "/decoder/convnext.5/act/Constant_2_output_0": "c000087", | |
| "/decoder/convnext.6/dwconv/Constant_output_0": "c000088", | |
| "/decoder/convnext.6/dwconv/Constant_1_output_0": "c000089", | |
| "/decoder/convnext.6/dwconv/Constant_2_output_0": "c000090", | |
| "/decoder/convnext.6/dwconv/Constant_3_output_0": "c000091", | |
| "/decoder/convnext.6/dwconv/Constant_4_output_0": "c000092", | |
| "/decoder/convnext.6/dwconv/Constant_5_output_0": "c000093", | |
| "/decoder/convnext.6/dwconv/Constant_6_output_0": "c000094", | |
| "/decoder/convnext.6/dwconv/Constant_7_output_0": "c000095", | |
| "/decoder/convnext.6/act/Constant_output_0": "c000096", | |
| "/decoder/convnext.6/act/Constant_1_output_0": "c000097", | |
| "/decoder/convnext.6/act/Constant_2_output_0": "c000098", | |
| "/decoder/convnext.7/dwconv/Constant_output_0": "c000099", | |
| "/decoder/convnext.7/dwconv/Constant_1_output_0": "c000100", | |
| "/decoder/convnext.7/dwconv/Constant_2_output_0": "c000101", | |
| "/decoder/convnext.7/dwconv/Constant_3_output_0": "c000102", | |
| "/decoder/convnext.7/dwconv/Constant_4_output_0": "c000103", | |
| "/decoder/convnext.7/dwconv/Constant_5_output_0": "c000104", | |
| "/decoder/convnext.7/dwconv/Constant_6_output_0": "c000105", | |
| "/decoder/convnext.7/dwconv/Constant_7_output_0": "c000106", | |
| "/decoder/convnext.7/act/Constant_output_0": "c000107", | |
| "/decoder/convnext.7/act/Constant_1_output_0": "c000108", | |
| "/decoder/convnext.7/act/Constant_2_output_0": "c000109", | |
| "/decoder/convnext.8/dwconv/Constant_output_0": "c000110", | |
| "/decoder/convnext.8/dwconv/Constant_1_output_0": "c000111", | |
| "/decoder/convnext.8/dwconv/Constant_2_output_0": "c000112", | |
| "/decoder/convnext.8/dwconv/Constant_3_output_0": "c000113", | |
| "/decoder/convnext.8/dwconv/Constant_4_output_0": "c000114", | |
| "/decoder/convnext.8/dwconv/Constant_5_output_0": "c000115", | |
| "/decoder/convnext.8/dwconv/Constant_6_output_0": "c000116", | |
| "/decoder/convnext.8/dwconv/Constant_7_output_0": "c000117", | |
| "/decoder/convnext.8/act/Constant_output_0": "c000118", | |
| "/decoder/convnext.8/act/Constant_1_output_0": "c000119", | |
| "/decoder/convnext.8/act/Constant_2_output_0": "c000120", | |
| "/decoder/convnext.9/dwconv/Constant_output_0": "c000121", | |
| "/decoder/convnext.9/dwconv/Constant_1_output_0": "c000122", | |
| "/decoder/convnext.9/dwconv/Constant_2_output_0": "c000123", | |
| "/decoder/convnext.9/dwconv/Constant_3_output_0": "c000124", | |
| "/decoder/convnext.9/dwconv/Constant_4_output_0": "c000125", | |
| "/decoder/convnext.9/dwconv/Constant_5_output_0": "c000126", | |
| "/decoder/convnext.9/dwconv/Constant_6_output_0": "c000127", | |
| "/decoder/convnext.9/dwconv/Constant_7_output_0": "c000128", | |
| "/decoder/convnext.9/act/Constant_output_0": "c000129", | |
| "/decoder/convnext.9/act/Constant_1_output_0": "c000130", | |
| "/decoder/convnext.9/act/Constant_2_output_0": "c000131", | |
| "/decoder/head/layer1/Constant_output_0": "c000132", | |
| "/decoder/head/layer1/Constant_1_output_0": "c000133", | |
| "/decoder/head/layer1/Constant_2_output_0": "c000134", | |
| "/decoder/head/layer1/Constant_3_output_0": "c000135", | |
| "/decoder/head/layer1/Constant_4_output_0": "c000136", | |
| "/decoder/head/layer1/Constant_5_output_0": "c000137", | |
| "/decoder/head/layer1/Constant_6_output_0": "c000138", | |
| "/decoder/head/layer1/Constant_7_output_0": "c000139", | |
| "/decoder/head/Constant_output_0": "c000140", | |
| "onnx::Unsqueeze_1434": "c000141", | |
| "/decoder/head/Constant_1_output_0": "c000142" | |
| }, | |
| "nodes": [ | |
| { | |
| "op_type": "Div", | |
| "name": "/Div", | |
| "inputs": [ | |
| "latent", | |
| "tts.ttl.normalizer.scale" | |
| ], | |
| "outputs": [ | |
| "/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Shape", | |
| "name": "/Shape", | |
| "inputs": [ | |
| "/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/Shape_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Gather", | |
| "name": "/Gather", | |
| "inputs": [ | |
| "/Shape_output_0", | |
| "/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/Gather_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Shape", | |
| "name": "/Shape_1", | |
| "inputs": [ | |
| "/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/Shape_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/Slice", | |
| "inputs": [ | |
| "/Shape_1_output_0", | |
| "/Constant_2_output_0", | |
| "/Constant_3_output_0", | |
| "/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Squeeze", | |
| "name": "/Squeeze", | |
| "inputs": [ | |
| "/Slice_output_0", | |
| "/Constant_4_output_0" | |
| ], | |
| "outputs": [ | |
| "/Squeeze_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Unsqueeze", | |
| "name": "/Unsqueeze", | |
| "inputs": [ | |
| "/Gather_output_0", | |
| "onnx::Unsqueeze_967" | |
| ], | |
| "outputs": [ | |
| "/Unsqueeze_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Unsqueeze", | |
| "name": "/Unsqueeze_1", | |
| "inputs": [ | |
| "/Squeeze_output_0", | |
| "onnx::Unsqueeze_973" | |
| ], | |
| "outputs": [ | |
| "/Unsqueeze_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/Concat", | |
| "inputs": [ | |
| "/Unsqueeze_output_0", | |
| "/Constant_5_output_0", | |
| "/Constant_6_output_0", | |
| "/Unsqueeze_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/Reshape", | |
| "inputs": [ | |
| "/Div_output_0", | |
| "/Concat_output_0" | |
| ], | |
| "outputs": [ | |
| "/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/Transpose", | |
| "inputs": [ | |
| "/Reshape_output_0" | |
| ], | |
| "outputs": [ | |
| "/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 1, | |
| 3, | |
| 2 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Shape", | |
| "name": "/Shape_2", | |
| "inputs": [ | |
| "/Transpose_output_0" | |
| ], | |
| "outputs": [ | |
| "/Shape_2_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Gather", | |
| "name": "/Gather_1", | |
| "inputs": [ | |
| "/Shape_2_output_0", | |
| "/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/Gather_1_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Shape", | |
| "name": "/Shape_3", | |
| "inputs": [ | |
| "/Transpose_output_0" | |
| ], | |
| "outputs": [ | |
| "/Shape_3_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Gather", | |
| "name": "/Gather_2", | |
| "inputs": [ | |
| "/Shape_3_output_0", | |
| "/Constant_8_output_0" | |
| ], | |
| "outputs": [ | |
| "/Gather_2_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Unsqueeze", | |
| "name": "/Unsqueeze_2", | |
| "inputs": [ | |
| "/Gather_1_output_0", | |
| "onnx::Unsqueeze_984" | |
| ], | |
| "outputs": [ | |
| "/Unsqueeze_2_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Unsqueeze", | |
| "name": "/Unsqueeze_3", | |
| "inputs": [ | |
| "/Gather_2_output_0", | |
| "onnx::Unsqueeze_986" | |
| ], | |
| "outputs": [ | |
| "/Unsqueeze_3_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/Concat_1", | |
| "inputs": [ | |
| "/Unsqueeze_2_output_0", | |
| "/Unsqueeze_3_output_0", | |
| "/Constant_9_output_0" | |
| ], | |
| "outputs": [ | |
| "/Concat_1_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/Reshape_1", | |
| "inputs": [ | |
| "/Transpose_output_0", | |
| "/Concat_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/Mul", | |
| "inputs": [ | |
| "/Reshape_1_output_0", | |
| "tts.ae.latent_std" | |
| ], | |
| "outputs": [ | |
| "/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/Add", | |
| "inputs": [ | |
| "/Mul_output_0", | |
| "tts.ae.latent_mean" | |
| ], | |
| "outputs": [ | |
| "/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/embed/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/embed/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/embed/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/embed/Concat", | |
| "inputs": [ | |
| "/decoder/embed/Constant_1_output_0", | |
| "/decoder/embed/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/embed/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/embed/Reshape", | |
| "inputs": [ | |
| "/decoder/embed/Concat_output_0", | |
| "/decoder/embed/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/embed/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/embed/Slice", | |
| "inputs": [ | |
| "/decoder/embed/Reshape_output_0", | |
| "/decoder/embed/Constant_4_output_0", | |
| "/decoder/embed/Constant_5_output_0", | |
| "/decoder/embed/Constant_3_output_0", | |
| "/decoder/embed/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/embed/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/embed/Transpose", | |
| "inputs": [ | |
| "/decoder/embed/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/embed/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/embed/Reshape_1", | |
| "inputs": [ | |
| "/decoder/embed/Transpose_output_0", | |
| "/decoder/embed/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/embed/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/embed/Cast", | |
| "inputs": [ | |
| "/decoder/embed/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/embed/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/embed/Pad", | |
| "inputs": [ | |
| "/Add_output_0", | |
| "/decoder/embed/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/embed/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/embed/net/Conv", | |
| "inputs": [ | |
| "/decoder/embed/Pad_output_0", | |
| "onnx::Conv_1441", | |
| "onnx::Conv_1442" | |
| ], | |
| "outputs": [ | |
| "/decoder/embed/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/convnext.0/dwconv/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/convnext.0/dwconv/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/convnext.0/dwconv/Concat", | |
| "inputs": [ | |
| "/decoder/convnext.0/dwconv/Constant_1_output_0", | |
| "/decoder/convnext.0/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/dwconv/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.0/dwconv/Reshape", | |
| "inputs": [ | |
| "/decoder/convnext.0/dwconv/Concat_output_0", | |
| "/decoder/convnext.0/dwconv/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/dwconv/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/convnext.0/dwconv/Slice", | |
| "inputs": [ | |
| "/decoder/convnext.0/dwconv/Reshape_output_0", | |
| "/decoder/convnext.0/dwconv/Constant_4_output_0", | |
| "/decoder/convnext.0/dwconv/Constant_5_output_0", | |
| "/decoder/convnext.0/dwconv/Constant_3_output_0", | |
| "/decoder/convnext.0/dwconv/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/dwconv/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.0/dwconv/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.0/dwconv/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/dwconv/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.0/dwconv/Reshape_1", | |
| "inputs": [ | |
| "/decoder/convnext.0/dwconv/Transpose_output_0", | |
| "/decoder/convnext.0/dwconv/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/dwconv/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/convnext.0/dwconv/Cast", | |
| "inputs": [ | |
| "/decoder/convnext.0/dwconv/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/dwconv/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/convnext.0/dwconv/Pad", | |
| "inputs": [ | |
| "/decoder/embed/net/Conv_output_0", | |
| "/decoder/convnext.0/dwconv/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/dwconv/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.0/dwconv/net/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.0/dwconv/Pad_output_0", | |
| "tts.ae.decoder.convnext.0.dwconv.net.weight", | |
| "tts.ae.decoder.convnext.0.dwconv.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/dwconv/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 512, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.0/norm/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.0/dwconv/net/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/norm/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "LayerNormalization", | |
| "name": "/decoder/convnext.0/norm/norm/LayerNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.0/norm/Transpose_output_0", | |
| "tts.ae.decoder.convnext.0.norm.norm.weight", | |
| "tts.ae.decoder.convnext.0.norm.norm.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "axis": -1, | |
| "epsilon": 9.999999974752427e-07 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.0/norm/Transpose_1", | |
| "inputs": [ | |
| "/decoder/convnext.0/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/norm/Transpose_1_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.0/pwconv1/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.0/norm/Transpose_1_output_0", | |
| "tts.ae.decoder.convnext.0.pwconv1.weight", | |
| "tts.ae.decoder.convnext.0.pwconv1.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/pwconv1/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Div", | |
| "name": "/decoder/convnext.0/act/Div", | |
| "inputs": [ | |
| "/decoder/convnext.0/pwconv1/Conv_output_0", | |
| "/decoder/convnext.0/act/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/act/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Erf", | |
| "name": "/decoder/convnext.0/act/Erf", | |
| "inputs": [ | |
| "/decoder/convnext.0/act/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/act/Erf_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.0/act/Add", | |
| "inputs": [ | |
| "/decoder/convnext.0/act/Erf_output_0", | |
| "/decoder/convnext.0/act/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/act/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.0/act/Mul", | |
| "inputs": [ | |
| "/decoder/convnext.0/pwconv1/Conv_output_0", | |
| "/decoder/convnext.0/act/Add_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/act/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.0/act/Mul_1", | |
| "inputs": [ | |
| "/decoder/convnext.0/act/Mul_output_0", | |
| "/decoder/convnext.0/act/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/act/Mul_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.0/pwconv2/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.0/act/Mul_1_output_0", | |
| "tts.ae.decoder.convnext.0.pwconv2.weight", | |
| "tts.ae.decoder.convnext.0.pwconv2.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/pwconv2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.0/Mul", | |
| "inputs": [ | |
| "tts.ae.decoder.convnext.0.gamma", | |
| "/decoder/convnext.0/pwconv2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.0/Add", | |
| "inputs": [ | |
| "/decoder/embed/net/Conv_output_0", | |
| "/decoder/convnext.0/Mul_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.0/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/convnext.1/dwconv/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/convnext.1/dwconv/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/convnext.1/dwconv/Concat", | |
| "inputs": [ | |
| "/decoder/convnext.1/dwconv/Constant_1_output_0", | |
| "/decoder/convnext.1/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/dwconv/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.1/dwconv/Reshape", | |
| "inputs": [ | |
| "/decoder/convnext.1/dwconv/Concat_output_0", | |
| "/decoder/convnext.1/dwconv/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/dwconv/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/convnext.1/dwconv/Slice", | |
| "inputs": [ | |
| "/decoder/convnext.1/dwconv/Reshape_output_0", | |
| "/decoder/convnext.1/dwconv/Constant_4_output_0", | |
| "/decoder/convnext.1/dwconv/Constant_5_output_0", | |
| "/decoder/convnext.1/dwconv/Constant_3_output_0", | |
| "/decoder/convnext.1/dwconv/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/dwconv/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.1/dwconv/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.1/dwconv/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/dwconv/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.1/dwconv/Reshape_1", | |
| "inputs": [ | |
| "/decoder/convnext.1/dwconv/Transpose_output_0", | |
| "/decoder/convnext.1/dwconv/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/dwconv/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/convnext.1/dwconv/Cast", | |
| "inputs": [ | |
| "/decoder/convnext.1/dwconv/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/dwconv/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/convnext.1/dwconv/Pad", | |
| "inputs": [ | |
| "/decoder/convnext.0/Add_output_0", | |
| "/decoder/convnext.1/dwconv/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/dwconv/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.1/dwconv/net/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.1/dwconv/Pad_output_0", | |
| "tts.ae.decoder.convnext.1.dwconv.net.weight", | |
| "tts.ae.decoder.convnext.1.dwconv.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/dwconv/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 2 | |
| ], | |
| "group": 512, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.1/norm/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.1/dwconv/net/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/norm/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "LayerNormalization", | |
| "name": "/decoder/convnext.1/norm/norm/LayerNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.1/norm/Transpose_output_0", | |
| "tts.ae.decoder.convnext.1.norm.norm.weight", | |
| "tts.ae.decoder.convnext.1.norm.norm.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "axis": -1, | |
| "epsilon": 9.999999974752427e-07 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.1/norm/Transpose_1", | |
| "inputs": [ | |
| "/decoder/convnext.1/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/norm/Transpose_1_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.1/pwconv1/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.1/norm/Transpose_1_output_0", | |
| "tts.ae.decoder.convnext.1.pwconv1.weight", | |
| "tts.ae.decoder.convnext.1.pwconv1.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/pwconv1/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Div", | |
| "name": "/decoder/convnext.1/act/Div", | |
| "inputs": [ | |
| "/decoder/convnext.1/pwconv1/Conv_output_0", | |
| "/decoder/convnext.1/act/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/act/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Erf", | |
| "name": "/decoder/convnext.1/act/Erf", | |
| "inputs": [ | |
| "/decoder/convnext.1/act/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/act/Erf_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.1/act/Add", | |
| "inputs": [ | |
| "/decoder/convnext.1/act/Erf_output_0", | |
| "/decoder/convnext.1/act/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/act/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.1/act/Mul", | |
| "inputs": [ | |
| "/decoder/convnext.1/pwconv1/Conv_output_0", | |
| "/decoder/convnext.1/act/Add_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/act/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.1/act/Mul_1", | |
| "inputs": [ | |
| "/decoder/convnext.1/act/Mul_output_0", | |
| "/decoder/convnext.1/act/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/act/Mul_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.1/pwconv2/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.1/act/Mul_1_output_0", | |
| "tts.ae.decoder.convnext.1.pwconv2.weight", | |
| "tts.ae.decoder.convnext.1.pwconv2.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/pwconv2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.1/Mul", | |
| "inputs": [ | |
| "tts.ae.decoder.convnext.1.gamma", | |
| "/decoder/convnext.1/pwconv2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.1/Add", | |
| "inputs": [ | |
| "/decoder/convnext.0/Add_output_0", | |
| "/decoder/convnext.1/Mul_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.1/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/convnext.2/dwconv/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/convnext.2/dwconv/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/convnext.2/dwconv/Concat", | |
| "inputs": [ | |
| "/decoder/convnext.2/dwconv/Constant_1_output_0", | |
| "/decoder/convnext.2/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/dwconv/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.2/dwconv/Reshape", | |
| "inputs": [ | |
| "/decoder/convnext.2/dwconv/Concat_output_0", | |
| "/decoder/convnext.2/dwconv/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/dwconv/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/convnext.2/dwconv/Slice", | |
| "inputs": [ | |
| "/decoder/convnext.2/dwconv/Reshape_output_0", | |
| "/decoder/convnext.2/dwconv/Constant_4_output_0", | |
| "/decoder/convnext.2/dwconv/Constant_5_output_0", | |
| "/decoder/convnext.2/dwconv/Constant_3_output_0", | |
| "/decoder/convnext.2/dwconv/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/dwconv/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.2/dwconv/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.2/dwconv/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/dwconv/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.2/dwconv/Reshape_1", | |
| "inputs": [ | |
| "/decoder/convnext.2/dwconv/Transpose_output_0", | |
| "/decoder/convnext.2/dwconv/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/dwconv/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/convnext.2/dwconv/Cast", | |
| "inputs": [ | |
| "/decoder/convnext.2/dwconv/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/dwconv/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/convnext.2/dwconv/Pad", | |
| "inputs": [ | |
| "/decoder/convnext.1/Add_output_0", | |
| "/decoder/convnext.2/dwconv/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/dwconv/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.2/dwconv/net/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.2/dwconv/Pad_output_0", | |
| "tts.ae.decoder.convnext.2.dwconv.net.weight", | |
| "tts.ae.decoder.convnext.2.dwconv.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/dwconv/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 4 | |
| ], | |
| "group": 512, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.2/norm/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.2/dwconv/net/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/norm/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "LayerNormalization", | |
| "name": "/decoder/convnext.2/norm/norm/LayerNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.2/norm/Transpose_output_0", | |
| "tts.ae.decoder.convnext.2.norm.norm.weight", | |
| "tts.ae.decoder.convnext.2.norm.norm.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "axis": -1, | |
| "epsilon": 9.999999974752427e-07 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.2/norm/Transpose_1", | |
| "inputs": [ | |
| "/decoder/convnext.2/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/norm/Transpose_1_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.2/pwconv1/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.2/norm/Transpose_1_output_0", | |
| "tts.ae.decoder.convnext.2.pwconv1.weight", | |
| "tts.ae.decoder.convnext.2.pwconv1.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/pwconv1/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Div", | |
| "name": "/decoder/convnext.2/act/Div", | |
| "inputs": [ | |
| "/decoder/convnext.2/pwconv1/Conv_output_0", | |
| "/decoder/convnext.2/act/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/act/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Erf", | |
| "name": "/decoder/convnext.2/act/Erf", | |
| "inputs": [ | |
| "/decoder/convnext.2/act/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/act/Erf_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.2/act/Add", | |
| "inputs": [ | |
| "/decoder/convnext.2/act/Erf_output_0", | |
| "/decoder/convnext.2/act/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/act/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.2/act/Mul", | |
| "inputs": [ | |
| "/decoder/convnext.2/pwconv1/Conv_output_0", | |
| "/decoder/convnext.2/act/Add_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/act/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.2/act/Mul_1", | |
| "inputs": [ | |
| "/decoder/convnext.2/act/Mul_output_0", | |
| "/decoder/convnext.2/act/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/act/Mul_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.2/pwconv2/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.2/act/Mul_1_output_0", | |
| "tts.ae.decoder.convnext.2.pwconv2.weight", | |
| "tts.ae.decoder.convnext.2.pwconv2.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/pwconv2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.2/Mul", | |
| "inputs": [ | |
| "tts.ae.decoder.convnext.2.gamma", | |
| "/decoder/convnext.2/pwconv2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.2/Add", | |
| "inputs": [ | |
| "/decoder/convnext.1/Add_output_0", | |
| "/decoder/convnext.2/Mul_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.2/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/convnext.3/dwconv/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/convnext.3/dwconv/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/convnext.3/dwconv/Concat", | |
| "inputs": [ | |
| "/decoder/convnext.3/dwconv/Constant_1_output_0", | |
| "/decoder/convnext.3/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/dwconv/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.3/dwconv/Reshape", | |
| "inputs": [ | |
| "/decoder/convnext.3/dwconv/Concat_output_0", | |
| "/decoder/convnext.3/dwconv/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/dwconv/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/convnext.3/dwconv/Slice", | |
| "inputs": [ | |
| "/decoder/convnext.3/dwconv/Reshape_output_0", | |
| "/decoder/convnext.3/dwconv/Constant_4_output_0", | |
| "/decoder/convnext.3/dwconv/Constant_5_output_0", | |
| "/decoder/convnext.3/dwconv/Constant_3_output_0", | |
| "/decoder/convnext.3/dwconv/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/dwconv/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.3/dwconv/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.3/dwconv/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/dwconv/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.3/dwconv/Reshape_1", | |
| "inputs": [ | |
| "/decoder/convnext.3/dwconv/Transpose_output_0", | |
| "/decoder/convnext.3/dwconv/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/dwconv/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/convnext.3/dwconv/Cast", | |
| "inputs": [ | |
| "/decoder/convnext.3/dwconv/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/dwconv/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/convnext.3/dwconv/Pad", | |
| "inputs": [ | |
| "/decoder/convnext.2/Add_output_0", | |
| "/decoder/convnext.3/dwconv/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/dwconv/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.3/dwconv/net/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.3/dwconv/Pad_output_0", | |
| "tts.ae.decoder.convnext.3.dwconv.net.weight", | |
| "tts.ae.decoder.convnext.3.dwconv.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/dwconv/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 512, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.3/norm/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.3/dwconv/net/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/norm/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "LayerNormalization", | |
| "name": "/decoder/convnext.3/norm/norm/LayerNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.3/norm/Transpose_output_0", | |
| "tts.ae.decoder.convnext.3.norm.norm.weight", | |
| "tts.ae.decoder.convnext.3.norm.norm.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "axis": -1, | |
| "epsilon": 9.999999974752427e-07 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.3/norm/Transpose_1", | |
| "inputs": [ | |
| "/decoder/convnext.3/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/norm/Transpose_1_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.3/pwconv1/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.3/norm/Transpose_1_output_0", | |
| "tts.ae.decoder.convnext.3.pwconv1.weight", | |
| "tts.ae.decoder.convnext.3.pwconv1.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/pwconv1/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Div", | |
| "name": "/decoder/convnext.3/act/Div", | |
| "inputs": [ | |
| "/decoder/convnext.3/pwconv1/Conv_output_0", | |
| "/decoder/convnext.3/act/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/act/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Erf", | |
| "name": "/decoder/convnext.3/act/Erf", | |
| "inputs": [ | |
| "/decoder/convnext.3/act/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/act/Erf_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.3/act/Add", | |
| "inputs": [ | |
| "/decoder/convnext.3/act/Erf_output_0", | |
| "/decoder/convnext.3/act/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/act/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.3/act/Mul", | |
| "inputs": [ | |
| "/decoder/convnext.3/pwconv1/Conv_output_0", | |
| "/decoder/convnext.3/act/Add_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/act/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.3/act/Mul_1", | |
| "inputs": [ | |
| "/decoder/convnext.3/act/Mul_output_0", | |
| "/decoder/convnext.3/act/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/act/Mul_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.3/pwconv2/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.3/act/Mul_1_output_0", | |
| "tts.ae.decoder.convnext.3.pwconv2.weight", | |
| "tts.ae.decoder.convnext.3.pwconv2.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/pwconv2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.3/Mul", | |
| "inputs": [ | |
| "tts.ae.decoder.convnext.3.gamma", | |
| "/decoder/convnext.3/pwconv2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.3/Add", | |
| "inputs": [ | |
| "/decoder/convnext.2/Add_output_0", | |
| "/decoder/convnext.3/Mul_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.3/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/convnext.4/dwconv/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/convnext.4/dwconv/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/convnext.4/dwconv/Concat", | |
| "inputs": [ | |
| "/decoder/convnext.4/dwconv/Constant_1_output_0", | |
| "/decoder/convnext.4/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/dwconv/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.4/dwconv/Reshape", | |
| "inputs": [ | |
| "/decoder/convnext.4/dwconv/Concat_output_0", | |
| "/decoder/convnext.4/dwconv/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/dwconv/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/convnext.4/dwconv/Slice", | |
| "inputs": [ | |
| "/decoder/convnext.4/dwconv/Reshape_output_0", | |
| "/decoder/convnext.4/dwconv/Constant_4_output_0", | |
| "/decoder/convnext.4/dwconv/Constant_5_output_0", | |
| "/decoder/convnext.4/dwconv/Constant_3_output_0", | |
| "/decoder/convnext.4/dwconv/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/dwconv/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.4/dwconv/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.4/dwconv/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/dwconv/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.4/dwconv/Reshape_1", | |
| "inputs": [ | |
| "/decoder/convnext.4/dwconv/Transpose_output_0", | |
| "/decoder/convnext.4/dwconv/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/dwconv/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/convnext.4/dwconv/Cast", | |
| "inputs": [ | |
| "/decoder/convnext.4/dwconv/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/dwconv/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/convnext.4/dwconv/Pad", | |
| "inputs": [ | |
| "/decoder/convnext.3/Add_output_0", | |
| "/decoder/convnext.4/dwconv/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/dwconv/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.4/dwconv/net/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.4/dwconv/Pad_output_0", | |
| "tts.ae.decoder.convnext.4.dwconv.net.weight", | |
| "tts.ae.decoder.convnext.4.dwconv.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/dwconv/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 2 | |
| ], | |
| "group": 512, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.4/norm/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.4/dwconv/net/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/norm/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "LayerNormalization", | |
| "name": "/decoder/convnext.4/norm/norm/LayerNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.4/norm/Transpose_output_0", | |
| "tts.ae.decoder.convnext.4.norm.norm.weight", | |
| "tts.ae.decoder.convnext.4.norm.norm.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "axis": -1, | |
| "epsilon": 9.999999974752427e-07 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.4/norm/Transpose_1", | |
| "inputs": [ | |
| "/decoder/convnext.4/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/norm/Transpose_1_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.4/pwconv1/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.4/norm/Transpose_1_output_0", | |
| "tts.ae.decoder.convnext.4.pwconv1.weight", | |
| "tts.ae.decoder.convnext.4.pwconv1.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/pwconv1/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Div", | |
| "name": "/decoder/convnext.4/act/Div", | |
| "inputs": [ | |
| "/decoder/convnext.4/pwconv1/Conv_output_0", | |
| "/decoder/convnext.4/act/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/act/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Erf", | |
| "name": "/decoder/convnext.4/act/Erf", | |
| "inputs": [ | |
| "/decoder/convnext.4/act/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/act/Erf_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.4/act/Add", | |
| "inputs": [ | |
| "/decoder/convnext.4/act/Erf_output_0", | |
| "/decoder/convnext.4/act/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/act/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.4/act/Mul", | |
| "inputs": [ | |
| "/decoder/convnext.4/pwconv1/Conv_output_0", | |
| "/decoder/convnext.4/act/Add_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/act/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.4/act/Mul_1", | |
| "inputs": [ | |
| "/decoder/convnext.4/act/Mul_output_0", | |
| "/decoder/convnext.4/act/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/act/Mul_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.4/pwconv2/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.4/act/Mul_1_output_0", | |
| "tts.ae.decoder.convnext.4.pwconv2.weight", | |
| "tts.ae.decoder.convnext.4.pwconv2.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/pwconv2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.4/Mul", | |
| "inputs": [ | |
| "tts.ae.decoder.convnext.4.gamma", | |
| "/decoder/convnext.4/pwconv2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.4/Add", | |
| "inputs": [ | |
| "/decoder/convnext.3/Add_output_0", | |
| "/decoder/convnext.4/Mul_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.4/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/convnext.5/dwconv/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/convnext.5/dwconv/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/convnext.5/dwconv/Concat", | |
| "inputs": [ | |
| "/decoder/convnext.5/dwconv/Constant_1_output_0", | |
| "/decoder/convnext.5/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/dwconv/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.5/dwconv/Reshape", | |
| "inputs": [ | |
| "/decoder/convnext.5/dwconv/Concat_output_0", | |
| "/decoder/convnext.5/dwconv/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/dwconv/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/convnext.5/dwconv/Slice", | |
| "inputs": [ | |
| "/decoder/convnext.5/dwconv/Reshape_output_0", | |
| "/decoder/convnext.5/dwconv/Constant_4_output_0", | |
| "/decoder/convnext.5/dwconv/Constant_5_output_0", | |
| "/decoder/convnext.5/dwconv/Constant_3_output_0", | |
| "/decoder/convnext.5/dwconv/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/dwconv/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.5/dwconv/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.5/dwconv/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/dwconv/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.5/dwconv/Reshape_1", | |
| "inputs": [ | |
| "/decoder/convnext.5/dwconv/Transpose_output_0", | |
| "/decoder/convnext.5/dwconv/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/dwconv/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/convnext.5/dwconv/Cast", | |
| "inputs": [ | |
| "/decoder/convnext.5/dwconv/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/dwconv/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/convnext.5/dwconv/Pad", | |
| "inputs": [ | |
| "/decoder/convnext.4/Add_output_0", | |
| "/decoder/convnext.5/dwconv/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/dwconv/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.5/dwconv/net/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.5/dwconv/Pad_output_0", | |
| "tts.ae.decoder.convnext.5.dwconv.net.weight", | |
| "tts.ae.decoder.convnext.5.dwconv.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/dwconv/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 4 | |
| ], | |
| "group": 512, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.5/norm/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.5/dwconv/net/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/norm/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "LayerNormalization", | |
| "name": "/decoder/convnext.5/norm/norm/LayerNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.5/norm/Transpose_output_0", | |
| "tts.ae.decoder.convnext.5.norm.norm.weight", | |
| "tts.ae.decoder.convnext.5.norm.norm.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "axis": -1, | |
| "epsilon": 9.999999974752427e-07 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.5/norm/Transpose_1", | |
| "inputs": [ | |
| "/decoder/convnext.5/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/norm/Transpose_1_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.5/pwconv1/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.5/norm/Transpose_1_output_0", | |
| "tts.ae.decoder.convnext.5.pwconv1.weight", | |
| "tts.ae.decoder.convnext.5.pwconv1.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/pwconv1/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Div", | |
| "name": "/decoder/convnext.5/act/Div", | |
| "inputs": [ | |
| "/decoder/convnext.5/pwconv1/Conv_output_0", | |
| "/decoder/convnext.5/act/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/act/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Erf", | |
| "name": "/decoder/convnext.5/act/Erf", | |
| "inputs": [ | |
| "/decoder/convnext.5/act/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/act/Erf_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.5/act/Add", | |
| "inputs": [ | |
| "/decoder/convnext.5/act/Erf_output_0", | |
| "/decoder/convnext.5/act/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/act/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.5/act/Mul", | |
| "inputs": [ | |
| "/decoder/convnext.5/pwconv1/Conv_output_0", | |
| "/decoder/convnext.5/act/Add_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/act/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.5/act/Mul_1", | |
| "inputs": [ | |
| "/decoder/convnext.5/act/Mul_output_0", | |
| "/decoder/convnext.5/act/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/act/Mul_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.5/pwconv2/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.5/act/Mul_1_output_0", | |
| "tts.ae.decoder.convnext.5.pwconv2.weight", | |
| "tts.ae.decoder.convnext.5.pwconv2.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/pwconv2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.5/Mul", | |
| "inputs": [ | |
| "tts.ae.decoder.convnext.5.gamma", | |
| "/decoder/convnext.5/pwconv2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.5/Add", | |
| "inputs": [ | |
| "/decoder/convnext.4/Add_output_0", | |
| "/decoder/convnext.5/Mul_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.5/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/convnext.6/dwconv/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/convnext.6/dwconv/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/convnext.6/dwconv/Concat", | |
| "inputs": [ | |
| "/decoder/convnext.6/dwconv/Constant_1_output_0", | |
| "/decoder/convnext.6/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/dwconv/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.6/dwconv/Reshape", | |
| "inputs": [ | |
| "/decoder/convnext.6/dwconv/Concat_output_0", | |
| "/decoder/convnext.6/dwconv/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/dwconv/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/convnext.6/dwconv/Slice", | |
| "inputs": [ | |
| "/decoder/convnext.6/dwconv/Reshape_output_0", | |
| "/decoder/convnext.6/dwconv/Constant_4_output_0", | |
| "/decoder/convnext.6/dwconv/Constant_5_output_0", | |
| "/decoder/convnext.6/dwconv/Constant_3_output_0", | |
| "/decoder/convnext.6/dwconv/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/dwconv/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.6/dwconv/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.6/dwconv/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/dwconv/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.6/dwconv/Reshape_1", | |
| "inputs": [ | |
| "/decoder/convnext.6/dwconv/Transpose_output_0", | |
| "/decoder/convnext.6/dwconv/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/dwconv/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/convnext.6/dwconv/Cast", | |
| "inputs": [ | |
| "/decoder/convnext.6/dwconv/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/dwconv/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/convnext.6/dwconv/Pad", | |
| "inputs": [ | |
| "/decoder/convnext.5/Add_output_0", | |
| "/decoder/convnext.6/dwconv/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/dwconv/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.6/dwconv/net/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.6/dwconv/Pad_output_0", | |
| "tts.ae.decoder.convnext.6.dwconv.net.weight", | |
| "tts.ae.decoder.convnext.6.dwconv.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/dwconv/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 512, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.6/norm/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.6/dwconv/net/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/norm/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "LayerNormalization", | |
| "name": "/decoder/convnext.6/norm/norm/LayerNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.6/norm/Transpose_output_0", | |
| "tts.ae.decoder.convnext.6.norm.norm.weight", | |
| "tts.ae.decoder.convnext.6.norm.norm.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "axis": -1, | |
| "epsilon": 9.999999974752427e-07 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.6/norm/Transpose_1", | |
| "inputs": [ | |
| "/decoder/convnext.6/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/norm/Transpose_1_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.6/pwconv1/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.6/norm/Transpose_1_output_0", | |
| "tts.ae.decoder.convnext.6.pwconv1.weight", | |
| "tts.ae.decoder.convnext.6.pwconv1.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/pwconv1/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Div", | |
| "name": "/decoder/convnext.6/act/Div", | |
| "inputs": [ | |
| "/decoder/convnext.6/pwconv1/Conv_output_0", | |
| "/decoder/convnext.6/act/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/act/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Erf", | |
| "name": "/decoder/convnext.6/act/Erf", | |
| "inputs": [ | |
| "/decoder/convnext.6/act/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/act/Erf_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.6/act/Add", | |
| "inputs": [ | |
| "/decoder/convnext.6/act/Erf_output_0", | |
| "/decoder/convnext.6/act/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/act/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.6/act/Mul", | |
| "inputs": [ | |
| "/decoder/convnext.6/pwconv1/Conv_output_0", | |
| "/decoder/convnext.6/act/Add_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/act/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.6/act/Mul_1", | |
| "inputs": [ | |
| "/decoder/convnext.6/act/Mul_output_0", | |
| "/decoder/convnext.6/act/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/act/Mul_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.6/pwconv2/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.6/act/Mul_1_output_0", | |
| "tts.ae.decoder.convnext.6.pwconv2.weight", | |
| "tts.ae.decoder.convnext.6.pwconv2.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/pwconv2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.6/Mul", | |
| "inputs": [ | |
| "tts.ae.decoder.convnext.6.gamma", | |
| "/decoder/convnext.6/pwconv2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.6/Add", | |
| "inputs": [ | |
| "/decoder/convnext.5/Add_output_0", | |
| "/decoder/convnext.6/Mul_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.6/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/convnext.7/dwconv/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/convnext.7/dwconv/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/convnext.7/dwconv/Concat", | |
| "inputs": [ | |
| "/decoder/convnext.7/dwconv/Constant_1_output_0", | |
| "/decoder/convnext.7/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/dwconv/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.7/dwconv/Reshape", | |
| "inputs": [ | |
| "/decoder/convnext.7/dwconv/Concat_output_0", | |
| "/decoder/convnext.7/dwconv/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/dwconv/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/convnext.7/dwconv/Slice", | |
| "inputs": [ | |
| "/decoder/convnext.7/dwconv/Reshape_output_0", | |
| "/decoder/convnext.7/dwconv/Constant_4_output_0", | |
| "/decoder/convnext.7/dwconv/Constant_5_output_0", | |
| "/decoder/convnext.7/dwconv/Constant_3_output_0", | |
| "/decoder/convnext.7/dwconv/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/dwconv/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.7/dwconv/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.7/dwconv/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/dwconv/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.7/dwconv/Reshape_1", | |
| "inputs": [ | |
| "/decoder/convnext.7/dwconv/Transpose_output_0", | |
| "/decoder/convnext.7/dwconv/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/dwconv/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/convnext.7/dwconv/Cast", | |
| "inputs": [ | |
| "/decoder/convnext.7/dwconv/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/dwconv/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/convnext.7/dwconv/Pad", | |
| "inputs": [ | |
| "/decoder/convnext.6/Add_output_0", | |
| "/decoder/convnext.7/dwconv/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/dwconv/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.7/dwconv/net/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.7/dwconv/Pad_output_0", | |
| "tts.ae.decoder.convnext.7.dwconv.net.weight", | |
| "tts.ae.decoder.convnext.7.dwconv.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/dwconv/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 512, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.7/norm/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.7/dwconv/net/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/norm/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "LayerNormalization", | |
| "name": "/decoder/convnext.7/norm/norm/LayerNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.7/norm/Transpose_output_0", | |
| "tts.ae.decoder.convnext.7.norm.norm.weight", | |
| "tts.ae.decoder.convnext.7.norm.norm.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "axis": -1, | |
| "epsilon": 9.999999974752427e-07 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.7/norm/Transpose_1", | |
| "inputs": [ | |
| "/decoder/convnext.7/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/norm/Transpose_1_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.7/pwconv1/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.7/norm/Transpose_1_output_0", | |
| "tts.ae.decoder.convnext.7.pwconv1.weight", | |
| "tts.ae.decoder.convnext.7.pwconv1.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/pwconv1/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Div", | |
| "name": "/decoder/convnext.7/act/Div", | |
| "inputs": [ | |
| "/decoder/convnext.7/pwconv1/Conv_output_0", | |
| "/decoder/convnext.7/act/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/act/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Erf", | |
| "name": "/decoder/convnext.7/act/Erf", | |
| "inputs": [ | |
| "/decoder/convnext.7/act/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/act/Erf_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.7/act/Add", | |
| "inputs": [ | |
| "/decoder/convnext.7/act/Erf_output_0", | |
| "/decoder/convnext.7/act/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/act/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.7/act/Mul", | |
| "inputs": [ | |
| "/decoder/convnext.7/pwconv1/Conv_output_0", | |
| "/decoder/convnext.7/act/Add_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/act/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.7/act/Mul_1", | |
| "inputs": [ | |
| "/decoder/convnext.7/act/Mul_output_0", | |
| "/decoder/convnext.7/act/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/act/Mul_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.7/pwconv2/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.7/act/Mul_1_output_0", | |
| "tts.ae.decoder.convnext.7.pwconv2.weight", | |
| "tts.ae.decoder.convnext.7.pwconv2.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/pwconv2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.7/Mul", | |
| "inputs": [ | |
| "tts.ae.decoder.convnext.7.gamma", | |
| "/decoder/convnext.7/pwconv2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.7/Add", | |
| "inputs": [ | |
| "/decoder/convnext.6/Add_output_0", | |
| "/decoder/convnext.7/Mul_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.7/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/convnext.8/dwconv/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/convnext.8/dwconv/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/convnext.8/dwconv/Concat", | |
| "inputs": [ | |
| "/decoder/convnext.8/dwconv/Constant_1_output_0", | |
| "/decoder/convnext.8/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/dwconv/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.8/dwconv/Reshape", | |
| "inputs": [ | |
| "/decoder/convnext.8/dwconv/Concat_output_0", | |
| "/decoder/convnext.8/dwconv/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/dwconv/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/convnext.8/dwconv/Slice", | |
| "inputs": [ | |
| "/decoder/convnext.8/dwconv/Reshape_output_0", | |
| "/decoder/convnext.8/dwconv/Constant_4_output_0", | |
| "/decoder/convnext.8/dwconv/Constant_5_output_0", | |
| "/decoder/convnext.8/dwconv/Constant_3_output_0", | |
| "/decoder/convnext.8/dwconv/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/dwconv/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.8/dwconv/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.8/dwconv/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/dwconv/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.8/dwconv/Reshape_1", | |
| "inputs": [ | |
| "/decoder/convnext.8/dwconv/Transpose_output_0", | |
| "/decoder/convnext.8/dwconv/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/dwconv/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/convnext.8/dwconv/Cast", | |
| "inputs": [ | |
| "/decoder/convnext.8/dwconv/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/dwconv/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/convnext.8/dwconv/Pad", | |
| "inputs": [ | |
| "/decoder/convnext.7/Add_output_0", | |
| "/decoder/convnext.8/dwconv/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/dwconv/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.8/dwconv/net/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.8/dwconv/Pad_output_0", | |
| "tts.ae.decoder.convnext.8.dwconv.net.weight", | |
| "tts.ae.decoder.convnext.8.dwconv.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/dwconv/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 512, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.8/norm/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.8/dwconv/net/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/norm/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "LayerNormalization", | |
| "name": "/decoder/convnext.8/norm/norm/LayerNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.8/norm/Transpose_output_0", | |
| "tts.ae.decoder.convnext.8.norm.norm.weight", | |
| "tts.ae.decoder.convnext.8.norm.norm.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "axis": -1, | |
| "epsilon": 9.999999974752427e-07 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.8/norm/Transpose_1", | |
| "inputs": [ | |
| "/decoder/convnext.8/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/norm/Transpose_1_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.8/pwconv1/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.8/norm/Transpose_1_output_0", | |
| "tts.ae.decoder.convnext.8.pwconv1.weight", | |
| "tts.ae.decoder.convnext.8.pwconv1.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/pwconv1/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Div", | |
| "name": "/decoder/convnext.8/act/Div", | |
| "inputs": [ | |
| "/decoder/convnext.8/pwconv1/Conv_output_0", | |
| "/decoder/convnext.8/act/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/act/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Erf", | |
| "name": "/decoder/convnext.8/act/Erf", | |
| "inputs": [ | |
| "/decoder/convnext.8/act/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/act/Erf_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.8/act/Add", | |
| "inputs": [ | |
| "/decoder/convnext.8/act/Erf_output_0", | |
| "/decoder/convnext.8/act/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/act/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.8/act/Mul", | |
| "inputs": [ | |
| "/decoder/convnext.8/pwconv1/Conv_output_0", | |
| "/decoder/convnext.8/act/Add_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/act/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.8/act/Mul_1", | |
| "inputs": [ | |
| "/decoder/convnext.8/act/Mul_output_0", | |
| "/decoder/convnext.8/act/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/act/Mul_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.8/pwconv2/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.8/act/Mul_1_output_0", | |
| "tts.ae.decoder.convnext.8.pwconv2.weight", | |
| "tts.ae.decoder.convnext.8.pwconv2.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/pwconv2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.8/Mul", | |
| "inputs": [ | |
| "tts.ae.decoder.convnext.8.gamma", | |
| "/decoder/convnext.8/pwconv2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.8/Add", | |
| "inputs": [ | |
| "/decoder/convnext.7/Add_output_0", | |
| "/decoder/convnext.8/Mul_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.8/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/convnext.9/dwconv/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/convnext.9/dwconv/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/convnext.9/dwconv/Concat", | |
| "inputs": [ | |
| "/decoder/convnext.9/dwconv/Constant_1_output_0", | |
| "/decoder/convnext.9/dwconv/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/dwconv/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.9/dwconv/Reshape", | |
| "inputs": [ | |
| "/decoder/convnext.9/dwconv/Concat_output_0", | |
| "/decoder/convnext.9/dwconv/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/dwconv/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/convnext.9/dwconv/Slice", | |
| "inputs": [ | |
| "/decoder/convnext.9/dwconv/Reshape_output_0", | |
| "/decoder/convnext.9/dwconv/Constant_4_output_0", | |
| "/decoder/convnext.9/dwconv/Constant_5_output_0", | |
| "/decoder/convnext.9/dwconv/Constant_3_output_0", | |
| "/decoder/convnext.9/dwconv/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/dwconv/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.9/dwconv/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.9/dwconv/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/dwconv/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/convnext.9/dwconv/Reshape_1", | |
| "inputs": [ | |
| "/decoder/convnext.9/dwconv/Transpose_output_0", | |
| "/decoder/convnext.9/dwconv/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/dwconv/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/convnext.9/dwconv/Cast", | |
| "inputs": [ | |
| "/decoder/convnext.9/dwconv/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/dwconv/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/convnext.9/dwconv/Pad", | |
| "inputs": [ | |
| "/decoder/convnext.8/Add_output_0", | |
| "/decoder/convnext.9/dwconv/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/dwconv/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.9/dwconv/net/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.9/dwconv/Pad_output_0", | |
| "tts.ae.decoder.convnext.9.dwconv.net.weight", | |
| "tts.ae.decoder.convnext.9.dwconv.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/dwconv/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 512, | |
| "kernel_shape": [ | |
| 7 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.9/norm/Transpose", | |
| "inputs": [ | |
| "/decoder/convnext.9/dwconv/net/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/norm/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "LayerNormalization", | |
| "name": "/decoder/convnext.9/norm/norm/LayerNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.9/norm/Transpose_output_0", | |
| "tts.ae.decoder.convnext.9.norm.norm.weight", | |
| "tts.ae.decoder.convnext.9.norm.norm.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "axis": -1, | |
| "epsilon": 9.999999974752427e-07 | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/convnext.9/norm/Transpose_1", | |
| "inputs": [ | |
| "/decoder/convnext.9/norm/norm/LayerNormalization_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/norm/Transpose_1_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.9/pwconv1/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.9/norm/Transpose_1_output_0", | |
| "tts.ae.decoder.convnext.9.pwconv1.weight", | |
| "tts.ae.decoder.convnext.9.pwconv1.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/pwconv1/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Div", | |
| "name": "/decoder/convnext.9/act/Div", | |
| "inputs": [ | |
| "/decoder/convnext.9/pwconv1/Conv_output_0", | |
| "/decoder/convnext.9/act/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/act/Div_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Erf", | |
| "name": "/decoder/convnext.9/act/Erf", | |
| "inputs": [ | |
| "/decoder/convnext.9/act/Div_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/act/Erf_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.9/act/Add", | |
| "inputs": [ | |
| "/decoder/convnext.9/act/Erf_output_0", | |
| "/decoder/convnext.9/act/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/act/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.9/act/Mul", | |
| "inputs": [ | |
| "/decoder/convnext.9/pwconv1/Conv_output_0", | |
| "/decoder/convnext.9/act/Add_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/act/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.9/act/Mul_1", | |
| "inputs": [ | |
| "/decoder/convnext.9/act/Mul_output_0", | |
| "/decoder/convnext.9/act/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/act/Mul_1_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/convnext.9/pwconv2/Conv", | |
| "inputs": [ | |
| "/decoder/convnext.9/act/Mul_1_output_0", | |
| "tts.ae.decoder.convnext.9.pwconv2.weight", | |
| "tts.ae.decoder.convnext.9.pwconv2.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/pwconv2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Mul", | |
| "name": "/decoder/convnext.9/Mul", | |
| "inputs": [ | |
| "tts.ae.decoder.convnext.9.gamma", | |
| "/decoder/convnext.9/pwconv2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/Mul_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Add", | |
| "name": "/decoder/convnext.9/Add", | |
| "inputs": [ | |
| "/decoder/convnext.8/Add_output_0", | |
| "/decoder/convnext.9/Mul_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/convnext.9/Add_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "BatchNormalization", | |
| "name": "/decoder/final_norm/BatchNormalization", | |
| "inputs": [ | |
| "/decoder/convnext.9/Add_output_0", | |
| "tts.ae.decoder.final_norm.norm.weight", | |
| "tts.ae.decoder.final_norm.norm.bias", | |
| "tts.ae.decoder.final_norm.norm.running_mean", | |
| "tts.ae.decoder.final_norm.norm.running_var" | |
| ], | |
| "outputs": [ | |
| "/decoder/final_norm/BatchNormalization_output_0" | |
| ], | |
| "attrs": { | |
| "epsilon": 9.999999747378752e-06, | |
| "momentum": 0.8999999761581421, | |
| "training_mode": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "ConstantOfShape", | |
| "name": "/decoder/head/layer1/ConstantOfShape", | |
| "inputs": [ | |
| "/decoder/head/layer1/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/layer1/ConstantOfShape_output_0" | |
| ], | |
| "attrs": { | |
| "value": { | |
| "dtype": "int64", | |
| "shape": [ | |
| 1 | |
| ], | |
| "data": [ | |
| 0 | |
| ] | |
| } | |
| } | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/head/layer1/Concat", | |
| "inputs": [ | |
| "/decoder/head/layer1/Constant_1_output_0", | |
| "/decoder/head/layer1/ConstantOfShape_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/layer1/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/head/layer1/Reshape", | |
| "inputs": [ | |
| "/decoder/head/layer1/Concat_output_0", | |
| "/decoder/head/layer1/Constant_2_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/layer1/Reshape_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Slice", | |
| "name": "/decoder/head/layer1/Slice", | |
| "inputs": [ | |
| "/decoder/head/layer1/Reshape_output_0", | |
| "/decoder/head/layer1/Constant_4_output_0", | |
| "/decoder/head/layer1/Constant_5_output_0", | |
| "/decoder/head/layer1/Constant_3_output_0", | |
| "/decoder/head/layer1/Constant_6_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/layer1/Slice_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/head/layer1/Transpose", | |
| "inputs": [ | |
| "/decoder/head/layer1/Slice_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/layer1/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 1, | |
| 0 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/head/layer1/Reshape_1", | |
| "inputs": [ | |
| "/decoder/head/layer1/Transpose_output_0", | |
| "/decoder/head/layer1/Constant_7_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/layer1/Reshape_1_output_0" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Cast", | |
| "name": "/decoder/head/layer1/Cast", | |
| "inputs": [ | |
| "/decoder/head/layer1/Reshape_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/layer1/Cast_output_0" | |
| ], | |
| "attrs": { | |
| "to": 7 | |
| } | |
| }, | |
| { | |
| "op_type": "Pad", | |
| "name": "/decoder/head/layer1/Pad", | |
| "inputs": [ | |
| "/decoder/final_norm/BatchNormalization_output_0", | |
| "/decoder/head/layer1/Cast_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/layer1/Pad_output_0" | |
| ], | |
| "attrs": { | |
| "mode": "edge" | |
| } | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/head/layer1/net/Conv", | |
| "inputs": [ | |
| "/decoder/head/layer1/Pad_output_0", | |
| "tts.ae.decoder.head.layer1.net.weight", | |
| "tts.ae.decoder.head.layer1.net.bias" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/layer1/net/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 3 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "PRelu", | |
| "name": "/decoder/head/act/PRelu", | |
| "inputs": [ | |
| "/decoder/head/layer1/net/Conv_output_0", | |
| "onnx::PRelu_1506" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/act/PRelu_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Conv", | |
| "name": "/decoder/head/layer2/Conv", | |
| "inputs": [ | |
| "/decoder/head/act/PRelu_output_0", | |
| "tts.ae.decoder.head.layer2.weight" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/layer2/Conv_output_0" | |
| ], | |
| "attrs": { | |
| "dilations": [ | |
| 1 | |
| ], | |
| "group": 1, | |
| "kernel_shape": [ | |
| 1 | |
| ], | |
| "pads": [ | |
| 0, | |
| 0 | |
| ], | |
| "strides": [ | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Transpose", | |
| "name": "/decoder/head/Transpose", | |
| "inputs": [ | |
| "/decoder/head/layer2/Conv_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/Transpose_output_0" | |
| ], | |
| "attrs": { | |
| "perm": [ | |
| 0, | |
| 2, | |
| 1 | |
| ] | |
| } | |
| }, | |
| { | |
| "op_type": "Shape", | |
| "name": "/decoder/head/Shape", | |
| "inputs": [ | |
| "/decoder/head/Transpose_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/Shape_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Gather", | |
| "name": "/decoder/head/Gather", | |
| "inputs": [ | |
| "/decoder/head/Shape_output_0", | |
| "/decoder/head/Constant_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/Gather_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Unsqueeze", | |
| "name": "/decoder/head/Unsqueeze", | |
| "inputs": [ | |
| "/decoder/head/Gather_output_0", | |
| "onnx::Unsqueeze_1434" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/Unsqueeze_output_0" | |
| ], | |
| "attrs": {} | |
| }, | |
| { | |
| "op_type": "Concat", | |
| "name": "/decoder/head/Concat", | |
| "inputs": [ | |
| "/decoder/head/Unsqueeze_output_0", | |
| "/decoder/head/Constant_1_output_0" | |
| ], | |
| "outputs": [ | |
| "/decoder/head/Concat_output_0" | |
| ], | |
| "attrs": { | |
| "axis": 0 | |
| } | |
| }, | |
| { | |
| "op_type": "Reshape", | |
| "name": "/decoder/head/Reshape", | |
| "inputs": [ | |
| "/decoder/head/Transpose_output_0", | |
| "/decoder/head/Concat_output_0" | |
| ], | |
| "outputs": [ | |
| "wav_tts" | |
| ], | |
| "attrs": { | |
| "allowzero": 0 | |
| } | |
| } | |
| ] | |
| } |