<?xml version="1.0"?>
<!--
ACE-Step-v1-ov-int4 / ov_vocoder_mel_transform_model.xml
rippertnt's picture
Upload 18 files
9dc8183 verified
-->
<net name="Model9" version="11">
<layers>
<!-- Model input "x": an f32 tensor of rank 2 with both dimensions dynamic (shape "?,?").
     NOTE(review): presumably (batch, audio samples); confirm against the exporting PyTorch module. -->
<layer id="0" name="x" type="Parameter" version="opset1">
<data shape="?,?" element_type="f32" />
<output>
<port id="0" precision="FP32" names="x">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<!-- Padding stage (layers 1 to 7).
     The rank-2 input is unsqueezed to [?, 1, ?], padded in reflect mode, and squeezed back to rank 2.
     Constant values (axis, pad amounts, pad value) are stored in the companion weights file at the
     given offset/size and are not visible in this XML. -->
<!-- Scalar i64 constant "21". The edge list wires it to the axis input of both the Unsqueeze (layer 2)
     and the Squeeze (layer 7). Port shapes imply the inserted/removed axis is the middle one. -->
<layer id="1" name="21" type="Const" version="opset1">
<data element_type="i64" shape="" offset="0" size="8" />
<output>
<port id="0" precision="I64" names="21" />
</output>
</layer>
<!-- [?, ?] to [?, 1, ?]. -->
<layer id="2" name="__module.spectrogram/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64" />
</input>
<output>
<port id="2" precision="FP32" names="23,input.1">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<!-- Three i64 pad amounts (one per axis of the rank-3 tensor). The edge list feeds this single constant
     to both port 1 and port 2 of the Pad layer, so begin and end padding are identical. -->
<layer id="3" name="__module.spectrogram/aten::pad/Concat" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="8" size="24" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<!-- Scalar stored as f16 and converted to f32 by layer 5; it feeds port 3 of the Pad layer.
     NOTE(review): port 3 is the pad value input, which the OpenVINO Pad spec uses only in constant
     mode; with pad_mode="reflect" it is presumably ignored. Confirm before relying on it. -->
<layer id="4" name="__module.spectrogram/aten::pad/ConvertLike_1_compressed" type="Const" version="opset1">
<data element_type="f16" shape="" offset="32" size="2" />
<output>
<port id="0" precision="FP16" />
</output>
</layer>
<layer id="5" name="__module.spectrogram/aten::pad/ConvertLike_1" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16" />
</input>
<output>
<port id="1" precision="FP32" />
</output>
</layer>
<!-- Reflect padding of the [?, 1, ?] tensor. Ports: 0 data, 1 and 2 pad amounts (same constant), 3 pad value. -->
<layer id="6" name="__module.spectrogram/aten::pad/Pad" type="Pad" version="opset12">
<data pad_mode="reflect" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
<port id="2" precision="I64">
<dim>3</dim>
</port>
<port id="3" precision="FP32" />
</input>
<output>
<port id="4" precision="FP32" names="25">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<!-- [?, 1, ?] back to [?, ?]; the result is the signal input of the STFT layer. -->
<layer id="7" name="__module.spectrogram/aten::squeeze/Squeeze" type="Squeeze" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64" />
</input>
<output>
<port id="2" precision="FP32" names="26,27,input,y">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<!-- STFT stage (layers 8 to 12).
     A 2048-element window is stored as f16, converted to f32, and passed with two scalar i64
     constants to the STFT operation applied to the padded rank-2 signal. -->
<!-- Window coefficients: 2048 f16 values (4096 bytes) in the weights file. -->
<layer id="8" name="self.spectrogram.window_compressed" type="Const" version="opset1">
<data element_type="f16" shape="2048" offset="34" size="4096" />
<output>
<port id="0" precision="FP16" names="self.spectrogram.window">
<dim>2048</dim>
</port>
</output>
</layer>
<!-- f16 to f32 conversion of the window, tagged with the "decompression" runtime attribute. -->
<layer id="9" name="self.spectrogram.window" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>2048</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>2048</dim>
</port>
</output>
</layer>
<!-- Scalar i64 constant "15"; the edge list connects it to STFT port 2.
     NOTE(review): per the OpenVINO STFT spec port 2 is frame_size; the 1025 output bins are
     consistent with a frame size of 2048 (2048 / 2 + 1), but the value itself is in the weights file. -->
<layer id="10" name="15" type="Const" version="opset1">
<data element_type="i64" shape="" offset="4130" size="8" />
<output>
<port id="0" precision="I64" names="15" />
</output>
</layer>
<!-- Scalar i64 constant "14"; the edge list connects it to STFT port 3.
     NOTE(review): per the OpenVINO STFT spec port 3 is frame_step (hop length); value not visible here. -->
<layer id="11" name="14" type="Const" version="opset1">
<data element_type="i64" shape="" offset="4138" size="8" />
<output>
<port id="0" precision="I64" names="14" />
</output>
</layer>
<!-- STFT with transpose_frames="true". Input [?, ?] signal; output [?, 1025, ?, 2].
     NOTE(review): the trailing dimension of size 2 presumably holds the real and imaginary parts. -->
<layer id="12" name="__module.spectrogram/aten::stft/STFT" type="STFT" version="opset15">
<data transpose_frames="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>2048</dim>
</port>
<port id="2" precision="I64" />
<port id="3" precision="I64" />
</input>
<output>
<port id="4" precision="FP32" names="29,spec.3">
<dim>-1</dim>
<dim>1025</dim>
<dim>-1</dim>
<dim>2</dim>
</port>
</output>
</layer>
<!-- Magnitude stage (layers 13 to 21): Power, ReduceSum, Add, Sqrt applied to the STFT output.
     The chain maps [?, 1025, ?, 2] to [?, 1025, ?]; the final tensor carries the names "spec" and "specgram".
     All three constants are stored as f16 and converted to f32 before use. -->
<!-- Exponent for the Power layer, shape [1, 1, 1, 1] so it broadcasts over the whole tensor.
     NOTE(review): presumably 2 (squaring each component); the value is in the weights file. -->
<layer id="13" name="Constant_121258_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 1, 1" offset="4146" size="2" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="14" name="Constant_121258" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<!-- Elementwise power with numpy-style broadcasting; shape is unchanged. -->
<layer id="15" name="__module.spectrogram/aten::pow/Power" type="Power" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1025</dim>
<dim>-1</dim>
<dim>2</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="30">
<dim>-1</dim>
<dim>1025</dim>
<dim>-1</dim>
<dim>2</dim>
</port>
</output>
</layer>
<!-- Single i64 reduction axis for ReduceSum. The port shapes show the size-2 trailing axis is the one removed. -->
<layer id="16" name="Constant_118930" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="4148" size="8" />
<output>
<port id="0" precision="I64" names="31">
<dim>1</dim>
</port>
</output>
</layer>
<!-- Sum over the reduction axis with keep_dims="false": [?, 1025, ?, 2] to [?, 1025, ?]. -->
<layer id="17" name="__module.spectrogram/aten::sum/ReduceSum" type="ReduceSum" version="opset1">
<data keep_dims="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1025</dim>
<dim>-1</dim>
<dim>2</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="32">
<dim>-1</dim>
<dim>1025</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<!-- Additive constant of shape [1, 1, 1] applied before the square root.
     NOTE(review): presumably a small epsilon for numerical stability; the value is in the weights file,
     and since it is stored as f16 a very small epsilon may not be representable. Verify. -->
<layer id="18" name="Constant_121259_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 1" offset="4156" size="2" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="19" name="Constant_121259" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="20" name="__module.spectrogram/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1025</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="33">
<dim>-1</dim>
<dim>1025</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<!-- Elementwise square root; the output feeds the mel MatMul layer. -->
<layer id="21" name="__module.spectrogram/aten::sqrt/Sqrt" type="Sqrt" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1025</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="34,35,spec,specgram">
<dim>-1</dim>
<dim>1025</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<!-- Mel projection stage (layers 22 to 26).
     The [?, 1025, ?] spectrogram is multiplied by a constant [128, 1025] matrix and the result is
     transposed so that the size-128 axis sits in the middle: final shape [?, 128, ?]. -->
<!-- Projection matrix: 128 x 1025 f16 values (128 * 1025 * 2 = 262400 bytes) in the weights file.
     NOTE(review): presumably the mel filter bank (the consuming layer is named mel_scale). -->
<layer id="22" name="Transpose_121127_compressed" type="Const" version="opset1">
<data element_type="f16" shape="128, 1025" offset="4158" size="262400" />
<output>
<port id="0" precision="FP16">
<dim>128</dim>
<dim>1025</dim>
</port>
</output>
</layer>
<layer id="23" name="Transpose_121127" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>128</dim>
<dim>1025</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>128</dim>
<dim>1025</dim>
</port>
</output>
</layer>
<!-- Both operands are transposed before multiplication: the first is treated as [?, ?, 1025] and the
     second as [1025, 128], which yields the declared output shape [?, ?, 128]. -->
<layer id="24" name="__module.mel_scale/aten::matmul/MatMul" type="MatMul" version="opset1">
<data transpose_a="true" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1025</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>128</dim>
<dim>1025</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="40">
<dim>-1</dim>
<dim>-1</dim>
<dim>128</dim>
</port>
</output>
</layer>
<!-- Three i32 values giving the axis order for the Transpose layer.
     NOTE(review): presumably [0, 2, 1] (swap of the last two axes); the value is in the weights file. -->
<layer id="25" name="__module.mel_scale/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="3" offset="266558" size="12" />
<output>
<port id="0" precision="I32">
<dim>3</dim>
</port>
</output>
</layer>
<!-- [?, ?, 128] to [?, 128, ?]. -->
<layer id="26" name="__module.mel_scale/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>128</dim>
</port>
<port id="1" precision="I32">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="41,x_1">
<dim>-1</dim>
<dim>128</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<!-- Output stage (layers 27 to 31): elementwise Maximum against a constant, natural Log, then Result.
     Shape stays [?, 128, ?] throughout. -->
<!-- Lower bound for the Maximum layer, shape [1, 1, 1], stored as f16 and converted to f32.
     NOTE(review): the value is in the weights file; it must be positive for the following Log to be
     finite, and being f16 it cannot hold values below the f16 subnormal range. Verify. -->
<layer id="27" name="Constant_121260_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 1" offset="266570" size="2" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="28" name="Constant_121260" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<!-- Elementwise max(input, constant) with numpy-style broadcasting; the layer name indicates it was
     produced from an aten::clamp call. -->
<layer id="29" name="aten::clamp/Maximum" type="Maximum" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>128</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="8">
<dim>-1</dim>
<dim>128</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<!-- Elementwise natural logarithm. Note that the output port declares no tensor names, so the model
     output has no name attached in this file. -->
<layer id="30" name="aten::log/Log" type="Log" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>128</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>128</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<!-- The single model output: f32 tensor of shape [?, 128, ?]. -->
<layer id="31" name="Result_119110" type="Result" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>128</dim>
<dim>-1</dim>
</port>
</input>
</layer>
</layers>
<!-- Graph wiring. Each edge connects output port "from-port" of layer "from-layer" to input port
     "to-port" of layer "to-layer"; the ids refer to the layer and port ids declared in the layers section.
     Two constants are shared: layer 1 feeds both layer 2 and layer 7, and layer 3 feeds ports 1 and 2 of layer 6.
     Apart from those, the graph is a single chain from layer 0 (Parameter) to layer 31 (Result). -->
<edges>
<edge from-layer="0" from-port="0" to-layer="2" to-port="0" />
<edge from-layer="1" from-port="0" to-layer="7" to-port="1" />
<edge from-layer="1" from-port="0" to-layer="2" to-port="1" />
<edge from-layer="2" from-port="2" to-layer="6" to-port="0" />
<edge from-layer="3" from-port="0" to-layer="6" to-port="1" />
<edge from-layer="3" from-port="0" to-layer="6" to-port="2" />
<edge from-layer="4" from-port="0" to-layer="5" to-port="0" />
<edge from-layer="5" from-port="1" to-layer="6" to-port="3" />
<edge from-layer="6" from-port="4" to-layer="7" to-port="0" />
<edge from-layer="7" from-port="2" to-layer="12" to-port="0" />
<edge from-layer="8" from-port="0" to-layer="9" to-port="0" />
<edge from-layer="9" from-port="1" to-layer="12" to-port="1" />
<edge from-layer="10" from-port="0" to-layer="12" to-port="2" />
<edge from-layer="11" from-port="0" to-layer="12" to-port="3" />
<edge from-layer="12" from-port="4" to-layer="15" to-port="0" />
<edge from-layer="13" from-port="0" to-layer="14" to-port="0" />
<edge from-layer="14" from-port="1" to-layer="15" to-port="1" />
<edge from-layer="15" from-port="2" to-layer="17" to-port="0" />
<edge from-layer="16" from-port="0" to-layer="17" to-port="1" />
<edge from-layer="17" from-port="2" to-layer="20" to-port="0" />
<edge from-layer="18" from-port="0" to-layer="19" to-port="0" />
<edge from-layer="19" from-port="1" to-layer="20" to-port="1" />
<edge from-layer="20" from-port="2" to-layer="21" to-port="0" />
<edge from-layer="21" from-port="1" to-layer="24" to-port="0" />
<edge from-layer="22" from-port="0" to-layer="23" to-port="0" />
<edge from-layer="23" from-port="1" to-layer="24" to-port="1" />
<edge from-layer="24" from-port="2" to-layer="26" to-port="0" />
<edge from-layer="25" from-port="0" to-layer="26" to-port="1" />
<edge from-layer="26" from-port="2" to-layer="29" to-port="0" />
<edge from-layer="27" from-port="0" to-layer="28" to-port="0" />
<edge from-layer="28" from-port="1" to-layer="29" to-port="1" />
<edge from-layer="29" from-port="2" to-layer="30" to-port="0" />
<edge from-layer="30" from-port="1" to-layer="31" to-port="0" />
</edges>
<!-- Model-level runtime info: the runtime version string recorded in the file, and the conversion
     parameters, which record "pytorch" as the source framework and is_python_object as "True". -->
<rt_info>
<Runtime_version value="2025.4.0-20398-7a975177ff4-releases/2025/4" />
<conversion_parameters>
<framework value="pytorch" />
<is_python_object value="True" />
</conversion_parameters>
</rt_info>
</net>