promptgen-base-ov / encoder.xml
lieding1994's picture
Upload folder using huggingface_hub
9b3a6a3 verified
<?xml version="1.0"?>
<net name="Model6" version="11">
<layers>
<layer id="1" name="attention_mask" type="Parameter" version="opset1">
<data shape="?,?" element_type="f32" />
<output>
<port id="0" precision="FP32" names="69,attention_mask">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="0" name="inputs_embeds" type="Parameter" version="opset1">
<data shape="?,?,?" element_type="f32" />
<output>
<port id="0" precision="FP32" names="45,46,inputs_embeds">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="2" name="self.model.embed_positions.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1026, 768" offset="0" size="1575936" />
<output>
<port id="0" precision="FP16" names="self.model.embed_positions.weight">
<dim>1026</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="3" name="self.model.embed_positions.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1026</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1026</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="4" name="30" type="Const" version="opset1">
<data element_type="i64" shape="" offset="1575936" size="8" />
<output>
<port id="0" precision="I64" names="30" />
</output>
</layer>
<layer id="5" name="ShapeOf_195276" type="ShapeOf" version="opset3">
<data output_type="i64" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="6" name="Constant_195277" type="Const" version="opset1">
<data element_type="i64" shape="" offset="1575944" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="7" name="Constant_195278" type="Const" version="opset1">
<data element_type="i64" shape="" offset="1575936" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="8" name="Gather_195279" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I64">
<dim>3</dim>
</port>
<port id="1" precision="I64" />
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I64" names="50,52" />
</output>
</layer>
<layer id="9" name="__module.model.embed_positions/aten::arange/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="1575952" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="10" name="__module.model.embed_positions/aten::arange/Range" type="Range" version="opset4">
<data output_type="i64" />
<input>
<port id="0" precision="I64" />
<port id="1" precision="I64" />
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="I64" names="54">
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="11" name="Constant_194996" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="1575956" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="12" name="Add_194053" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="I64">
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="13" name="Constant_194055" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="1575944" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="14" name="Constant_195280" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="1575944" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="15" name="Reshape_195281" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="I64" />
<port id="1" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="16" name="Concat_194056" type="Concat" version="opset1">
<data axis="0" />
<input>
<port id="0" precision="I64">
<dim>1</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="17" name="Constant_195285" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="1575936" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="18" name="Constant_195286" type="Const" version="opset1">
<data element_type="i64" shape="" offset="1575936" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="19" name="Gather_195287" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I64">
<dim>3</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I64" names="49">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="20" name="Constant_193833" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="1575944" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="21" name="__module.model.embed_positions/prim::ListConstruct" type="Concat" version="opset1">
<data axis="0" />
<input>
<port id="0" precision="I64">
<dim>1</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="22" name="Maximum_194057" type="Maximum" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="I64">
<dim>2</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="23" name="__module.model.embed_positions/aten::add/Add_1" type="Broadcast" version="opset3">
<data mode="numpy" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="2" precision="I64" names="57,input.1">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="24" name="__module.model.embed_positions/aten::embedding/Convert" type="Convert" version="opset1">
<data destination_type="i32" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="25" name="__module.model.embed_positions/aten::embedding/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="1575964" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="26" name="__module.model.embed_positions/aten::embedding/Gather" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="FP32">
<dim>1026</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="FP32" names="58,59,embed_pos,embed_pos.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="27" name="__module.model/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="60,input.3">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="28" name="__module.model.layernorm_embedding/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="29" name="__module.model.layernorm_embedding/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="30" name="Constant_194997_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="1575972" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="31" name="Constant_194997" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="32" name="__module.model.layernorm_embedding/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="33" name="Constant_194998_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="1577508" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="34" name="Constant_194998" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="35" name="__module.model.layernorm_embedding/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="64,input.5">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="36" name="self.model.layers.0.self_attn.q_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="1579044" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.0.self_attn.q_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="37" name="self.model.layers.0.self_attn.q_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="38" name="__module.model.layers.0.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="39" name="Constant_194999_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="2758692" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="40" name="Constant_194999" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="41" name="__module.model.layers.0.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="92,tensor.5">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="42" name="Constant_195366" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="43" name="__module.model.layers.0.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="108">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="44" name="__module.model.layers.0.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="45" name="__module.model.layers.0.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="109">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="46" name="self.model.layers.0.self_attn.k_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="2760276" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.0.self_attn.k_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="47" name="self.model.layers.0.self_attn.k_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="48" name="__module.model.layers.0.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="49" name="Constant_195000_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="3939924" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="50" name="Constant_195000" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="51" name="__module.model.layers.0.self_attn.k_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="95,tensor.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="52" name="Constant_195367" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="53" name="__module.model.layers.0.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="97">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="54" name="__module.model.layers.0.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="55" name="__module.model.layers.0.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="98">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="56" name="self.model.layers.0.self_attn.v_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="3941460" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.0.self_attn.v_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="57" name="self.model.layers.0.self_attn.v_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="58" name="__module.model.layers.0.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="59" name="Constant_195001_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="5121108" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="60" name="Constant_195001" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="61" name="__module.model.layers.0.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="102,tensor.3">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="62" name="Constant_195368" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="63" name="__module.model.layers.0.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="104">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="64" name="__module.model.layers.0.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="65" name="__module.model.layers.0.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="105">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="66" name="Constant_195002_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 1, 1" offset="5122644" size="2" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="67" name="Constant_195002" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="68" name="28" type="Const" version="opset1">
<data element_type="i64" shape="" offset="1575944" size="8" />
<output>
<port id="0" precision="I64" names="28" />
</output>
</layer>
<layer id="69" name="__module.model/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64" />
</input>
<output>
<port id="2" precision="FP32" names="70">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="70" name="27" type="Const" version="opset1">
<data element_type="i64" shape="" offset="1575956" size="8" />
<output>
<port id="0" precision="I64" names="27" />
</output>
</layer>
<layer id="71" name="__module.model/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64" />
</input>
<output>
<port id="2" precision="FP32" names="71,72">
<dim>-1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="72" name="Subtract_194127" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="73" name="ShapeOf_194128" type="ShapeOf" version="opset3">
<data output_type="i64" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="74" name="Constant_195295" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="1575936" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="75" name="Constant_195296" type="Const" version="opset1">
<data element_type="i64" shape="" offset="1575936" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="76" name="Gather_195297" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I64">
<dim>4</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I64" names="67">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="77" name="Constant_193839" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="1575944" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="78" name="__module.model/aten::size/ShapeOf" type="ShapeOf" version="opset3">
<data output_type="i64" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="79" name="Constant_193968" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="5122646" size="16" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="80" name="Constant_193969" type="Const" version="opset1">
<data element_type="i64" shape="" offset="1575936" size="8" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="81" name="Gather_193970" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I64">
<dim>2</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="82" name="__module.model/prim::ListConstruct" type="Concat" version="opset1">
<data axis="0" />
<input>
<port id="0" precision="I64">
<dim>1</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="3" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="83" name="Maximum_194129" type="Maximum" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="I64">
<dim>4</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="84" name="__module.model/aten::rsub/Subtract" type="Broadcast" version="opset3">
<data mode="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="76,inverted_mask">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="85" name="__module.model/aten::to/Convert_2" type="Convert" version="opset1">
<data destination_type="boolean" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="BOOL" names="77">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="86" name="__module.model/aten::masked_fill/ConvertLike" type="Const" version="opset1">
<data element_type="f32" shape="" offset="5122662" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="87" name="__module.model/aten::masked_fill/Select" type="Select" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="BOOL">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="78,attention_mask_1">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="88" name="__module.model.layers.0.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="111,attn_output.1">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="89" name="__module.model.layers.0.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="90" name="__module.model.layers.0.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="112,attn_output.3">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="91" name="__module.model.layers.0.self_attn/aten::size/ShapeOf" type="ShapeOf" version="opset3">
<data output_type="i64" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="92" name="__module.model.layers.0.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="114,input.7">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="93" name="self.model.layers.0.self_attn.out_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="5122666" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.0.self_attn.out_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="94" name="self.model.layers.0.self_attn.out_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="95" name="__module.model.layers.0.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="96" name="Constant_195003_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="6302314" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="97" name="Constant_195003" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="98" name="__module.model.layers.0.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="117,input.9">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="99" name="__module.model.layers.0/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="119,input.11">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="100" name="__module.model.layers.0.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="101" name="__module.model.layers.0.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="102" name="Constant_195004_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="6303850" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="103" name="Constant_195004" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="104" name="__module.model.layers.0.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="105" name="Constant_195005_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="6305386" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="106" name="Constant_195005" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="107" name="__module.model.layers.0.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="123,input.13">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="108" name="self.model.layers.0.fc1.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="3072, 768" offset="6306922" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.0.fc1.weight">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="109" name="self.model.layers.0.fc1.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="110" name="__module.model.layers.0.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="111" name="Constant_195006_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 3072" offset="11025514" size="6144" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="112" name="Constant_195006" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="113" name="__module.model.layers.0.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="126,input.15">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="114" name="__module.model.layers.0.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="127,input.17">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="115" name="self.model.layers.0.fc2.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 3072" offset="11031658" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.0.fc2.weight">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="116" name="self.model.layers.0.fc2.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="117" name="__module.model.layers.0.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="118" name="Constant_195007_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="15750250" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="119" name="Constant_195007" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="120" name="__module.model.layers.0.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="131,input.21">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="121" name="__module.model.layers.0/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="133,input.23">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="122" name="__module.model.layers.0.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="123" name="__module.model.layers.0.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="124" name="Constant_195008_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="15751786" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="125" name="Constant_195008" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="126" name="__module.model.layers.0.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="127" name="Constant_195009_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="15753322" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="128" name="Constant_195009" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="129" name="__module.model.layers.0.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="137,hidden_states.7">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="130" name="self.model.layers.1.self_attn.q_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="15754858" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.1.self_attn.q_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="131" name="self.model.layers.1.self_attn.q_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="132" name="__module.model.layers.1.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="133" name="Constant_195010_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="16934506" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="134" name="Constant_195010" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="135" name="__module.model.layers.1.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="151,tensor.11">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="136" name="Constant_195369" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="137" name="__module.model.layers.1.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="167">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="138" name="__module.model.layers.1.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="139" name="__module.model.layers.1.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="168">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="140" name="self.model.layers.1.self_attn.k_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="16936042" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.1.self_attn.k_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="141" name="self.model.layers.1.self_attn.k_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="142" name="__module.model.layers.1.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="143" name="Constant_195011_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="18115690" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="144" name="Constant_195011" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="145" name="__module.model.layers.1.self_attn.k_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="154,tensor.7">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="146" name="Constant_195370" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="147" name="__module.model.layers.1.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="156">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="148" name="__module.model.layers.1.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="149" name="__module.model.layers.1.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="157">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="150" name="self.model.layers.1.self_attn.v_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="18117226" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.1.self_attn.v_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="151" name="self.model.layers.1.self_attn.v_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="152" name="__module.model.layers.1.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="153" name="Constant_195012_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="19296874" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="154" name="Constant_195012" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="155" name="__module.model.layers.1.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="161,tensor.9">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="156" name="Constant_195371" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="157" name="__module.model.layers.1.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="163">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="158" name="__module.model.layers.1.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="159" name="__module.model.layers.1.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="164">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="160" name="__module.model.layers.1.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="170,attn_output.5">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="161" name="__module.model.layers.1.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="162" name="__module.model.layers.1.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="171,attn_output.7">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="163" name="__module.model.layers.1.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="173,input.25">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="164" name="self.model.layers.1.self_attn.out_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="19298410" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.1.self_attn.out_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="165" name="self.model.layers.1.self_attn.out_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="166" name="__module.model.layers.1.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="167" name="Constant_195013_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="20478058" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="168" name="Constant_195013" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="169" name="__module.model.layers.1.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="176,input.27">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="170" name="__module.model.layers.1/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="178,input.29">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="171" name="__module.model.layers.1.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="172" name="__module.model.layers.1.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="173" name="Constant_195014_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="20479594" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="174" name="Constant_195014" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="175" name="__module.model.layers.1.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="176" name="Constant_195015_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="20481130" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="177" name="Constant_195015" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="178" name="__module.model.layers.1.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="182,input.31">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="179" name="self.model.layers.1.fc1.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="3072, 768" offset="20482666" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.1.fc1.weight">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="180" name="self.model.layers.1.fc1.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="181" name="__module.model.layers.1.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="182" name="Constant_195016_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 3072" offset="25201258" size="6144" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="183" name="Constant_195016" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="184" name="__module.model.layers.1.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="185,input.33">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="185" name="__module.model.layers.1.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="186,input.35">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="186" name="self.model.layers.1.fc2.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 3072" offset="25207402" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.1.fc2.weight">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="187" name="self.model.layers.1.fc2.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="188" name="__module.model.layers.1.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="189" name="Constant_195017_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="29925994" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="190" name="Constant_195017" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="191" name="__module.model.layers.1.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="190,input.39">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="192" name="__module.model.layers.1/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="192,input.41">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="193" name="__module.model.layers.1.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="194" name="__module.model.layers.1.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="195" name="Constant_195018_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="29927530" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="196" name="Constant_195018" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="197" name="__module.model.layers.1.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="198" name="Constant_195019_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="29929066" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="199" name="Constant_195019" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="200" name="__module.model.layers.1.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="196,hidden_states.13">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="201" name="self.model.layers.2.self_attn.q_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="29930602" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.2.self_attn.q_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="202" name="self.model.layers.2.self_attn.q_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="203" name="__module.model.layers.2.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="204" name="Constant_195020_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="31110250" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="205" name="Constant_195020" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="206" name="__module.model.layers.2.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="210,tensor.17">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="207" name="Constant_195372" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="208" name="__module.model.layers.2.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="226">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="209" name="__module.model.layers.2.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="210" name="__module.model.layers.2.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="227">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="211" name="self.model.layers.2.self_attn.k_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="31111786" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.2.self_attn.k_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="212" name="self.model.layers.2.self_attn.k_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="213" name="__module.model.layers.2.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="214" name="Constant_195021_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="32291434" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="215" name="Constant_195021" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="216" name="__module.model.layers.2.self_attn.k_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="213,tensor.13">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="217" name="Constant_195373" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="218" name="__module.model.layers.2.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="215">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="219" name="__module.model.layers.2.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="220" name="__module.model.layers.2.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="216">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="221" name="self.model.layers.2.self_attn.v_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="32292970" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.2.self_attn.v_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="222" name="self.model.layers.2.self_attn.v_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="223" name="__module.model.layers.2.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="224" name="Constant_195022_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="33472618" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="225" name="Constant_195022" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="226" name="__module.model.layers.2.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="220,tensor.15">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="227" name="Constant_195374" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="228" name="__module.model.layers.2.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="222">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="229" name="__module.model.layers.2.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="230" name="__module.model.layers.2.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="223">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="231" name="__module.model.layers.2.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="229,attn_output.9">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="232" name="__module.model.layers.2.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="233" name="__module.model.layers.2.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="230,attn_output.11">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="234" name="__module.model.layers.2.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="232,input.43">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="235" name="self.model.layers.2.self_attn.out_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="33474154" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.2.self_attn.out_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="236" name="self.model.layers.2.self_attn.out_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="237" name="__module.model.layers.2.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="238" name="Constant_195023_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="34653802" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="239" name="Constant_195023" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="240" name="__module.model.layers.2.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="235,input.45">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="241" name="__module.model.layers.2/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="237,input.47">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="242" name="__module.model.layers.2.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="243" name="__module.model.layers.2.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="244" name="Constant_195024_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="34655338" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="245" name="Constant_195024" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="246" name="__module.model.layers.2.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="247" name="Constant_195025_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="34656874" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="248" name="Constant_195025" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="249" name="__module.model.layers.2.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="241,input.49">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="250" name="self.model.layers.2.fc1.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="3072, 768" offset="34658410" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.2.fc1.weight">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="251" name="self.model.layers.2.fc1.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="252" name="__module.model.layers.2.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="253" name="Constant_195026_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 3072" offset="39377002" size="6144" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="254" name="Constant_195026" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="255" name="__module.model.layers.2.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="244,input.51">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="256" name="__module.model.layers.2.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="245,input.53">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="257" name="self.model.layers.2.fc2.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 3072" offset="39383146" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.2.fc2.weight">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="258" name="self.model.layers.2.fc2.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="259" name="__module.model.layers.2.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="260" name="Constant_195027_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="44101738" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="261" name="Constant_195027" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="262" name="__module.model.layers.2.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="249,input.57">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="263" name="__module.model.layers.2/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="251,input.59">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="264" name="__module.model.layers.2.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="265" name="__module.model.layers.2.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="266" name="Constant_195028_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="44103274" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="267" name="Constant_195028" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="268" name="__module.model.layers.2.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="269" name="Constant_195029_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="44104810" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="270" name="Constant_195029" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="271" name="__module.model.layers.2.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="255,hidden_states.19">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="272" name="self.model.layers.3.self_attn.q_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="44106346" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.3.self_attn.q_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="273" name="self.model.layers.3.self_attn.q_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="274" name="__module.model.layers.3.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="275" name="Constant_195030_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="45285994" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="276" name="Constant_195030" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="277" name="__module.model.layers.3.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="269,tensor.23">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="278" name="Constant_195375" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="279" name="__module.model.layers.3.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="285">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="280" name="__module.model.layers.3.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="281" name="__module.model.layers.3.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="286">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="282" name="self.model.layers.3.self_attn.k_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="45287530" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.3.self_attn.k_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="283" name="self.model.layers.3.self_attn.k_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="284" name="__module.model.layers.3.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="285" name="Constant_195031_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="46467178" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="286" name="Constant_195031" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="287" name="__module.model.layers.3.self_attn.k_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="272,tensor.19">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="288" name="Constant_195376" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="289" name="__module.model.layers.3.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="274">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="290" name="__module.model.layers.3.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="291" name="__module.model.layers.3.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="275">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="292" name="self.model.layers.3.self_attn.v_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="46468714" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.3.self_attn.v_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="293" name="self.model.layers.3.self_attn.v_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="294" name="__module.model.layers.3.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="295" name="Constant_195032_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="47648362" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="296" name="Constant_195032" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="297" name="__module.model.layers.3.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="279,tensor.21">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="298" name="Constant_195377" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="299" name="__module.model.layers.3.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="281">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="300" name="__module.model.layers.3.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="301" name="__module.model.layers.3.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="282">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="302" name="__module.model.layers.3.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="288,attn_output.13">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="303" name="__module.model.layers.3.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="304" name="__module.model.layers.3.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="289,attn_output.15">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="305" name="__module.model.layers.3.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="291,input.61">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="306" name="self.model.layers.3.self_attn.out_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="47649898" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.3.self_attn.out_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="307" name="self.model.layers.3.self_attn.out_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="308" name="__module.model.layers.3.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="309" name="Constant_195033_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="48829546" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="310" name="Constant_195033" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="311" name="__module.model.layers.3.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="294,input.63">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="312" name="__module.model.layers.3/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="296,input.65">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="313" name="__module.model.layers.3.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="314" name="__module.model.layers.3.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="315" name="Constant_195034_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="48831082" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="316" name="Constant_195034" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="317" name="__module.model.layers.3.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="318" name="Constant_195035_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="48832618" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="319" name="Constant_195035" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="320" name="__module.model.layers.3.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="300,input.67">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="321" name="self.model.layers.3.fc1.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="3072, 768" offset="48834154" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.3.fc1.weight">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="322" name="self.model.layers.3.fc1.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="323" name="__module.model.layers.3.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="324" name="Constant_195036_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 3072" offset="53552746" size="6144" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="325" name="Constant_195036" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="326" name="__module.model.layers.3.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="303,input.69">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="327" name="__module.model.layers.3.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="304,input.71">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="328" name="self.model.layers.3.fc2.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 3072" offset="53558890" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.3.fc2.weight">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="329" name="self.model.layers.3.fc2.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="330" name="__module.model.layers.3.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="331" name="Constant_195037_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="58277482" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="332" name="Constant_195037" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="333" name="__module.model.layers.3.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="308,input.75">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="334" name="__module.model.layers.3/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="310,input.77">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="335" name="__module.model.layers.3.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="336" name="__module.model.layers.3.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="337" name="Constant_195038_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="58279018" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="338" name="Constant_195038" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="339" name="__module.model.layers.3.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="340" name="Constant_195039_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="58280554" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="341" name="Constant_195039" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="342" name="__module.model.layers.3.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="314,hidden_states.25">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="343" name="self.model.layers.4.self_attn.q_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="58282090" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.4.self_attn.q_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="344" name="self.model.layers.4.self_attn.q_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="345" name="__module.model.layers.4.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="346" name="Constant_195040_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="59461738" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="347" name="Constant_195040" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="348" name="__module.model.layers.4.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="328,tensor.29">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="349" name="Constant_195378" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="350" name="__module.model.layers.4.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="344">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="351" name="__module.model.layers.4.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="352" name="__module.model.layers.4.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="345">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="353" name="self.model.layers.4.self_attn.k_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="59463274" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.4.self_attn.k_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="354" name="self.model.layers.4.self_attn.k_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="355" name="__module.model.layers.4.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="356" name="Constant_195041_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="60642922" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="357" name="Constant_195041" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="358" name="__module.model.layers.4.self_attn.k_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="331,tensor.25">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="359" name="Constant_195379" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="360" name="__module.model.layers.4.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="333">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="361" name="__module.model.layers.4.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="362" name="__module.model.layers.4.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="334">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="363" name="self.model.layers.4.self_attn.v_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="60644458" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.4.self_attn.v_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="364" name="self.model.layers.4.self_attn.v_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="365" name="__module.model.layers.4.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="366" name="Constant_195042_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="61824106" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="367" name="Constant_195042" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="368" name="__module.model.layers.4.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="338,tensor.27">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="369" name="Constant_195380" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="370" name="__module.model.layers.4.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="340">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="371" name="__module.model.layers.4.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="372" name="__module.model.layers.4.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="341">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="373" name="__module.model.layers.4.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="347,attn_output.17">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="374" name="__module.model.layers.4.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="375" name="__module.model.layers.4.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="348,attn_output.19">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="376" name="__module.model.layers.4.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="350,input.79">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="377" name="self.model.layers.4.self_attn.out_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="61825642" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.4.self_attn.out_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="378" name="self.model.layers.4.self_attn.out_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="379" name="__module.model.layers.4.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="380" name="Constant_195043_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="63005290" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="381" name="Constant_195043" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="382" name="__module.model.layers.4.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="353,input.81">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="383" name="__module.model.layers.4/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="355,input.83">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="384" name="__module.model.layers.4.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="385" name="__module.model.layers.4.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="386" name="Constant_195044_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="63006826" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="387" name="Constant_195044" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="388" name="__module.model.layers.4.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="389" name="Constant_195045_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="63008362" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="390" name="Constant_195045" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="391" name="__module.model.layers.4.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="359,input.85">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="392" name="self.model.layers.4.fc1.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="3072, 768" offset="63009898" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.4.fc1.weight">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="393" name="self.model.layers.4.fc1.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="394" name="__module.model.layers.4.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="395" name="Constant_195046_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 3072" offset="67728490" size="6144" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="396" name="Constant_195046" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="397" name="__module.model.layers.4.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="362,input.87">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="398" name="__module.model.layers.4.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="363,input.89">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="399" name="self.model.layers.4.fc2.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 3072" offset="67734634" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.4.fc2.weight">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="400" name="self.model.layers.4.fc2.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="401" name="__module.model.layers.4.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="402" name="Constant_195047_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="72453226" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="403" name="Constant_195047" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="404" name="__module.model.layers.4.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="367,input.93">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="405" name="__module.model.layers.4/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="369,input.95">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="406" name="__module.model.layers.4.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="407" name="__module.model.layers.4.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="408" name="Constant_195048_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="72454762" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="409" name="Constant_195048" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="410" name="__module.model.layers.4.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="411" name="Constant_195049_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="72456298" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="412" name="Constant_195049" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="413" name="__module.model.layers.4.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="373,hidden_states.31">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="414" name="self.model.layers.5.self_attn.q_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="72457834" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.5.self_attn.q_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="415" name="self.model.layers.5.self_attn.q_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="416" name="__module.model.layers.5.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="417" name="Constant_195050_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="73637482" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="418" name="Constant_195050" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="419" name="__module.model.layers.5.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="387,tensor">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="420" name="Constant_195381" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="421" name="__module.model.layers.5.self_attn/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="403">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="422" name="__module.model.layers.5.self_attn/aten::transpose/Constant" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="423" name="__module.model.layers.5.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="404">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="424" name="self.model.layers.5.self_attn.k_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="73639018" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.5.self_attn.k_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="425" name="self.model.layers.5.self_attn.k_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="426" name="__module.model.layers.5.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="427" name="Constant_195051_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="74818666" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="428" name="Constant_195051" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="429" name="__module.model.layers.5.self_attn.k_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="390,tensor.31">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="430" name="Constant_195382" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="431" name="__module.model.layers.5.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="392">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="432" name="__module.model.layers.5.self_attn/aten::transpose/Constant_1" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="433" name="__module.model.layers.5.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="393">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="434" name="self.model.layers.5.self_attn.v_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="74820202" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.5.self_attn.v_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="435" name="self.model.layers.5.self_attn.v_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="436" name="__module.model.layers.5.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="437" name="Constant_195052_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="75999850" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="438" name="Constant_195052" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="439" name="__module.model.layers.5.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="397,tensor.33">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="440" name="Constant_195383" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="2760228" size="32" />
<rt_info>
<attribute name="precise" version="0" />
</rt_info>
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="441" name="__module.model.layers.5.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="399">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="442" name="__module.model.layers.5.self_attn/aten::transpose/Constant_2" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="443" name="__module.model.layers.5.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="400">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="444" name="__module.model.layers.5.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="406,attn_output.21">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="445" name="__module.model.layers.5.self_attn/aten::transpose/Constant_3" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="2760260" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="446" name="__module.model.layers.5.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>64</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="407,attn_output">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
</output>
</layer>
<layer id="447" name="__module.model.layers.5.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>64</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="409,input.97">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="448" name="self.model.layers.5.self_attn.out_proj.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 768" offset="76001386" size="1179648" />
<output>
<port id="0" precision="FP16" names="self.model.layers.5.self_attn.out_proj.weight">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="449" name="self.model.layers.5.self_attn.out_proj.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="450" name="__module.model.layers.5.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="451" name="Constant_195053_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="77181034" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="452" name="Constant_195053" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="453" name="__module.model.layers.5.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="412,input.99">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="454" name="__module.model.layers.5/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="414,input.101">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="455" name="__module.model.layers.5.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="456" name="__module.model.layers.5.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="457" name="Constant_195054_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="77182570" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="458" name="Constant_195054" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="459" name="__module.model.layers.5.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="460" name="Constant_195055_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="77184106" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="461" name="Constant_195055" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="462" name="__module.model.layers.5.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="418,input.103">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="463" name="self.model.layers.5.fc1.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="3072, 768" offset="77185642" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.5.fc1.weight">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="464" name="self.model.layers.5.fc1.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="465" name="__module.model.layers.5.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>3072</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="466" name="Constant_195056_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 3072" offset="81904234" size="6144" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="467" name="Constant_195056" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="468" name="__module.model.layers.5.fc1/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="421,input.105">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="469" name="__module.model.layers.5.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="422,input.107">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="470" name="self.model.layers.5.fc2.weight_compressed" type="Const" version="opset1">
<data element_type="f16" shape="768, 3072" offset="81910378" size="4718592" />
<output>
<port id="0" precision="FP16" names="self.model.layers.5.fc2.weight">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="471" name="self.model.layers.5.fc2.weight" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</output>
</layer>
<layer id="472" name="__module.model.layers.5.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>3072</dim>
</port>
<port id="1" precision="FP32">
<dim>768</dim>
<dim>3072</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="473" name="Constant_195057_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="86628970" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="474" name="Constant_195057" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="475" name="__module.model.layers.5.fc2/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="426,input.111">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="476" name="__module.model.layers.5/aten::add/Add_1" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="428,input">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="477" name="__module.model.layers.5.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="1575968" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="478" name="__module.model.layers.5.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="479" name="Constant_195058_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="86630506" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="480" name="Constant_195058" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="481" name="__module.model.layers.5.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="482" name="Constant_195059_compressed" type="Const" version="opset1">
<data element_type="f16" shape="1, 1, 768" offset="86632042" size="1536" />
<output>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="483" name="Constant_195059" type="Convert" version="opset1">
<data destination_type="f32" />
<rt_info>
<attribute name="decompression" version="0" />
</rt_info>
<input>
<port id="0" precision="FP16">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="484" name="__module.model.layers.5.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>768</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="last_hidden_state">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</output>
</layer>
<layer id="485" name="Result_190330" type="Result" version="opset1" output_names="last_hidden_state">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>768</dim>
</port>
</input>
</layer>
</layers>
<edges>
<edge from-layer="0" from-port="0" to-layer="5" to-port="0" />
<edge from-layer="0" from-port="0" to-layer="27" to-port="0" />
<edge from-layer="1" from-port="0" to-layer="78" to-port="0" />
<edge from-layer="1" from-port="0" to-layer="69" to-port="0" />
<edge from-layer="2" from-port="0" to-layer="3" to-port="0" />
<edge from-layer="3" from-port="1" to-layer="26" to-port="0" />
<edge from-layer="4" from-port="0" to-layer="10" to-port="0" />
<edge from-layer="5" from-port="1" to-layer="19" to-port="0" />
<edge from-layer="5" from-port="1" to-layer="8" to-port="0" />
<edge from-layer="6" from-port="0" to-layer="8" to-port="1" />
<edge from-layer="7" from-port="0" to-layer="8" to-port="2" />
<edge from-layer="8" from-port="3" to-layer="10" to-port="1" />
<edge from-layer="8" from-port="3" to-layer="15" to-port="0" />
<edge from-layer="9" from-port="0" to-layer="10" to-port="2" />
<edge from-layer="10" from-port="3" to-layer="12" to-port="0" />
<edge from-layer="11" from-port="0" to-layer="12" to-port="1" />
<edge from-layer="12" from-port="2" to-layer="23" to-port="0" />
<edge from-layer="13" from-port="0" to-layer="16" to-port="0" />
<edge from-layer="14" from-port="0" to-layer="15" to-port="1" />
<edge from-layer="15" from-port="2" to-layer="16" to-port="1" />
<edge from-layer="16" from-port="2" to-layer="22" to-port="0" />
<edge from-layer="17" from-port="0" to-layer="19" to-port="1" />
<edge from-layer="18" from-port="0" to-layer="19" to-port="2" />
<edge from-layer="19" from-port="3" to-layer="21" to-port="0" />
<edge from-layer="20" from-port="0" to-layer="21" to-port="1" />
<edge from-layer="21" from-port="2" to-layer="22" to-port="1" />
<edge from-layer="22" from-port="2" to-layer="23" to-port="1" />
<edge from-layer="23" from-port="2" to-layer="24" to-port="0" />
<edge from-layer="24" from-port="1" to-layer="26" to-port="1" />
<edge from-layer="25" from-port="0" to-layer="26" to-port="2" />
<edge from-layer="26" from-port="3" to-layer="27" to-port="1" />
<edge from-layer="27" from-port="2" to-layer="29" to-port="0" />
<edge from-layer="28" from-port="0" to-layer="29" to-port="1" />
<edge from-layer="29" from-port="2" to-layer="32" to-port="0" />
<edge from-layer="30" from-port="0" to-layer="31" to-port="0" />
<edge from-layer="31" from-port="1" to-layer="32" to-port="1" />
<edge from-layer="32" from-port="2" to-layer="35" to-port="0" />
<edge from-layer="33" from-port="0" to-layer="34" to-port="0" />
<edge from-layer="34" from-port="1" to-layer="35" to-port="1" />
<edge from-layer="35" from-port="2" to-layer="91" to-port="0" />
<edge from-layer="35" from-port="2" to-layer="99" to-port="0" />
<edge from-layer="35" from-port="2" to-layer="58" to-port="0" />
<edge from-layer="35" from-port="2" to-layer="48" to-port="0" />
<edge from-layer="35" from-port="2" to-layer="38" to-port="0" />
<edge from-layer="36" from-port="0" to-layer="37" to-port="0" />
<edge from-layer="37" from-port="1" to-layer="38" to-port="1" />
<edge from-layer="38" from-port="2" to-layer="41" to-port="0" />
<edge from-layer="39" from-port="0" to-layer="40" to-port="0" />
<edge from-layer="40" from-port="1" to-layer="41" to-port="1" />
<edge from-layer="41" from-port="2" to-layer="43" to-port="0" />
<edge from-layer="42" from-port="0" to-layer="43" to-port="1" />
<edge from-layer="43" from-port="2" to-layer="45" to-port="0" />
<edge from-layer="44" from-port="0" to-layer="45" to-port="1" />
<edge from-layer="45" from-port="2" to-layer="88" to-port="0" />
<edge from-layer="46" from-port="0" to-layer="47" to-port="0" />
<edge from-layer="47" from-port="1" to-layer="48" to-port="1" />
<edge from-layer="48" from-port="2" to-layer="51" to-port="0" />
<edge from-layer="49" from-port="0" to-layer="50" to-port="0" />
<edge from-layer="50" from-port="1" to-layer="51" to-port="1" />
<edge from-layer="51" from-port="2" to-layer="53" to-port="0" />
<edge from-layer="52" from-port="0" to-layer="53" to-port="1" />
<edge from-layer="53" from-port="2" to-layer="55" to-port="0" />
<edge from-layer="54" from-port="0" to-layer="55" to-port="1" />
<edge from-layer="55" from-port="2" to-layer="88" to-port="1" />
<edge from-layer="56" from-port="0" to-layer="57" to-port="0" />
<edge from-layer="57" from-port="1" to-layer="58" to-port="1" />
<edge from-layer="58" from-port="2" to-layer="61" to-port="0" />
<edge from-layer="59" from-port="0" to-layer="60" to-port="0" />
<edge from-layer="60" from-port="1" to-layer="61" to-port="1" />
<edge from-layer="61" from-port="2" to-layer="63" to-port="0" />
<edge from-layer="62" from-port="0" to-layer="63" to-port="1" />
<edge from-layer="63" from-port="2" to-layer="65" to-port="0" />
<edge from-layer="64" from-port="0" to-layer="65" to-port="1" />
<edge from-layer="65" from-port="2" to-layer="88" to-port="2" />
<edge from-layer="66" from-port="0" to-layer="67" to-port="0" />
<edge from-layer="67" from-port="1" to-layer="72" to-port="0" />
<edge from-layer="68" from-port="0" to-layer="69" to-port="1" />
<edge from-layer="69" from-port="2" to-layer="71" to-port="0" />
<edge from-layer="70" from-port="0" to-layer="71" to-port="1" />
<edge from-layer="71" from-port="2" to-layer="72" to-port="1" />
<edge from-layer="72" from-port="2" to-layer="73" to-port="0" />
<edge from-layer="72" from-port="2" to-layer="84" to-port="0" />
<edge from-layer="73" from-port="1" to-layer="76" to-port="0" />
<edge from-layer="73" from-port="1" to-layer="83" to-port="0" />
<edge from-layer="74" from-port="0" to-layer="76" to-port="1" />
<edge from-layer="75" from-port="0" to-layer="76" to-port="2" />
<edge from-layer="76" from-port="3" to-layer="82" to-port="0" />
<edge from-layer="77" from-port="0" to-layer="82" to-port="1" />
<edge from-layer="78" from-port="1" to-layer="81" to-port="0" />
<edge from-layer="79" from-port="0" to-layer="81" to-port="1" />
<edge from-layer="80" from-port="0" to-layer="81" to-port="2" />
<edge from-layer="81" from-port="3" to-layer="82" to-port="2" />
<edge from-layer="82" from-port="3" to-layer="83" to-port="1" />
<edge from-layer="83" from-port="2" to-layer="84" to-port="1" />
<edge from-layer="84" from-port="2" to-layer="87" to-port="2" />
<edge from-layer="84" from-port="2" to-layer="85" to-port="0" />
<edge from-layer="85" from-port="1" to-layer="87" to-port="0" />
<edge from-layer="86" from-port="0" to-layer="87" to-port="1" />
<edge from-layer="87" from-port="3" to-layer="444" to-port="3" />
<edge from-layer="87" from-port="3" to-layer="373" to-port="3" />
<edge from-layer="87" from-port="3" to-layer="231" to-port="3" />
<edge from-layer="87" from-port="3" to-layer="160" to-port="3" />
<edge from-layer="87" from-port="3" to-layer="302" to-port="3" />
<edge from-layer="87" from-port="3" to-layer="88" to-port="3" />
<edge from-layer="88" from-port="4" to-layer="90" to-port="0" />
<edge from-layer="89" from-port="0" to-layer="90" to-port="1" />
<edge from-layer="90" from-port="2" to-layer="92" to-port="0" />
<edge from-layer="91" from-port="1" to-layer="234" to-port="1" />
<edge from-layer="91" from-port="1" to-layer="447" to-port="1" />
<edge from-layer="91" from-port="1" to-layer="376" to-port="1" />
<edge from-layer="91" from-port="1" to-layer="305" to-port="1" />
<edge from-layer="91" from-port="1" to-layer="163" to-port="1" />
<edge from-layer="91" from-port="1" to-layer="92" to-port="1" />
<edge from-layer="92" from-port="2" to-layer="95" to-port="0" />
<edge from-layer="93" from-port="0" to-layer="94" to-port="0" />
<edge from-layer="94" from-port="1" to-layer="95" to-port="1" />
<edge from-layer="95" from-port="2" to-layer="98" to-port="0" />
<edge from-layer="96" from-port="0" to-layer="97" to-port="0" />
<edge from-layer="97" from-port="1" to-layer="98" to-port="1" />
<edge from-layer="98" from-port="2" to-layer="99" to-port="1" />
<edge from-layer="99" from-port="2" to-layer="101" to-port="0" />
<edge from-layer="100" from-port="0" to-layer="101" to-port="1" />
<edge from-layer="101" from-port="2" to-layer="104" to-port="0" />
<edge from-layer="102" from-port="0" to-layer="103" to-port="0" />
<edge from-layer="103" from-port="1" to-layer="104" to-port="1" />
<edge from-layer="104" from-port="2" to-layer="107" to-port="0" />
<edge from-layer="105" from-port="0" to-layer="106" to-port="0" />
<edge from-layer="106" from-port="1" to-layer="107" to-port="1" />
<edge from-layer="107" from-port="2" to-layer="110" to-port="0" />
<edge from-layer="107" from-port="2" to-layer="121" to-port="0" />
<edge from-layer="108" from-port="0" to-layer="109" to-port="0" />
<edge from-layer="109" from-port="1" to-layer="110" to-port="1" />
<edge from-layer="110" from-port="2" to-layer="113" to-port="0" />
<edge from-layer="111" from-port="0" to-layer="112" to-port="0" />
<edge from-layer="112" from-port="1" to-layer="113" to-port="1" />
<edge from-layer="113" from-port="2" to-layer="114" to-port="0" />
<edge from-layer="114" from-port="1" to-layer="117" to-port="0" />
<edge from-layer="115" from-port="0" to-layer="116" to-port="0" />
<edge from-layer="116" from-port="1" to-layer="117" to-port="1" />
<edge from-layer="117" from-port="2" to-layer="120" to-port="0" />
<edge from-layer="118" from-port="0" to-layer="119" to-port="0" />
<edge from-layer="119" from-port="1" to-layer="120" to-port="1" />
<edge from-layer="120" from-port="2" to-layer="121" to-port="1" />
<edge from-layer="121" from-port="2" to-layer="123" to-port="0" />
<edge from-layer="122" from-port="0" to-layer="123" to-port="1" />
<edge from-layer="123" from-port="2" to-layer="126" to-port="0" />
<edge from-layer="124" from-port="0" to-layer="125" to-port="0" />
<edge from-layer="125" from-port="1" to-layer="126" to-port="1" />
<edge from-layer="126" from-port="2" to-layer="129" to-port="0" />
<edge from-layer="127" from-port="0" to-layer="128" to-port="0" />
<edge from-layer="128" from-port="1" to-layer="129" to-port="1" />
<edge from-layer="129" from-port="2" to-layer="170" to-port="0" />
<edge from-layer="129" from-port="2" to-layer="152" to-port="0" />
<edge from-layer="129" from-port="2" to-layer="132" to-port="0" />
<edge from-layer="129" from-port="2" to-layer="142" to-port="0" />
<edge from-layer="130" from-port="0" to-layer="131" to-port="0" />
<edge from-layer="131" from-port="1" to-layer="132" to-port="1" />
<edge from-layer="132" from-port="2" to-layer="135" to-port="0" />
<edge from-layer="133" from-port="0" to-layer="134" to-port="0" />
<edge from-layer="134" from-port="1" to-layer="135" to-port="1" />
<edge from-layer="135" from-port="2" to-layer="137" to-port="0" />
<edge from-layer="136" from-port="0" to-layer="137" to-port="1" />
<edge from-layer="137" from-port="2" to-layer="139" to-port="0" />
<edge from-layer="138" from-port="0" to-layer="139" to-port="1" />
<edge from-layer="139" from-port="2" to-layer="160" to-port="0" />
<edge from-layer="140" from-port="0" to-layer="141" to-port="0" />
<edge from-layer="141" from-port="1" to-layer="142" to-port="1" />
<edge from-layer="142" from-port="2" to-layer="145" to-port="0" />
<edge from-layer="143" from-port="0" to-layer="144" to-port="0" />
<edge from-layer="144" from-port="1" to-layer="145" to-port="1" />
<edge from-layer="145" from-port="2" to-layer="147" to-port="0" />
<edge from-layer="146" from-port="0" to-layer="147" to-port="1" />
<edge from-layer="147" from-port="2" to-layer="149" to-port="0" />
<edge from-layer="148" from-port="0" to-layer="149" to-port="1" />
<edge from-layer="149" from-port="2" to-layer="160" to-port="1" />
<edge from-layer="150" from-port="0" to-layer="151" to-port="0" />
<edge from-layer="151" from-port="1" to-layer="152" to-port="1" />
<edge from-layer="152" from-port="2" to-layer="155" to-port="0" />
<edge from-layer="153" from-port="0" to-layer="154" to-port="0" />
<edge from-layer="154" from-port="1" to-layer="155" to-port="1" />
<edge from-layer="155" from-port="2" to-layer="157" to-port="0" />
<edge from-layer="156" from-port="0" to-layer="157" to-port="1" />
<edge from-layer="157" from-port="2" to-layer="159" to-port="0" />
<edge from-layer="158" from-port="0" to-layer="159" to-port="1" />
<edge from-layer="159" from-port="2" to-layer="160" to-port="2" />
<edge from-layer="160" from-port="4" to-layer="162" to-port="0" />
<edge from-layer="161" from-port="0" to-layer="162" to-port="1" />
<edge from-layer="162" from-port="2" to-layer="163" to-port="0" />
<edge from-layer="163" from-port="2" to-layer="166" to-port="0" />
<edge from-layer="164" from-port="0" to-layer="165" to-port="0" />
<edge from-layer="165" from-port="1" to-layer="166" to-port="1" />
<edge from-layer="166" from-port="2" to-layer="169" to-port="0" />
<edge from-layer="167" from-port="0" to-layer="168" to-port="0" />
<edge from-layer="168" from-port="1" to-layer="169" to-port="1" />
<edge from-layer="169" from-port="2" to-layer="170" to-port="1" />
<edge from-layer="170" from-port="2" to-layer="172" to-port="0" />
<edge from-layer="171" from-port="0" to-layer="172" to-port="1" />
<edge from-layer="172" from-port="2" to-layer="175" to-port="0" />
<edge from-layer="173" from-port="0" to-layer="174" to-port="0" />
<edge from-layer="174" from-port="1" to-layer="175" to-port="1" />
<edge from-layer="175" from-port="2" to-layer="178" to-port="0" />
<edge from-layer="176" from-port="0" to-layer="177" to-port="0" />
<edge from-layer="177" from-port="1" to-layer="178" to-port="1" />
<edge from-layer="178" from-port="2" to-layer="181" to-port="0" />
<edge from-layer="178" from-port="2" to-layer="192" to-port="0" />
<edge from-layer="179" from-port="0" to-layer="180" to-port="0" />
<edge from-layer="180" from-port="1" to-layer="181" to-port="1" />
<edge from-layer="181" from-port="2" to-layer="184" to-port="0" />
<edge from-layer="182" from-port="0" to-layer="183" to-port="0" />
<edge from-layer="183" from-port="1" to-layer="184" to-port="1" />
<edge from-layer="184" from-port="2" to-layer="185" to-port="0" />
<edge from-layer="185" from-port="1" to-layer="188" to-port="0" />
<edge from-layer="186" from-port="0" to-layer="187" to-port="0" />
<edge from-layer="187" from-port="1" to-layer="188" to-port="1" />
<edge from-layer="188" from-port="2" to-layer="191" to-port="0" />
<edge from-layer="189" from-port="0" to-layer="190" to-port="0" />
<edge from-layer="190" from-port="1" to-layer="191" to-port="1" />
<edge from-layer="191" from-port="2" to-layer="192" to-port="1" />
<edge from-layer="192" from-port="2" to-layer="194" to-port="0" />
<edge from-layer="193" from-port="0" to-layer="194" to-port="1" />
<edge from-layer="194" from-port="2" to-layer="197" to-port="0" />
<edge from-layer="195" from-port="0" to-layer="196" to-port="0" />
<edge from-layer="196" from-port="1" to-layer="197" to-port="1" />
<edge from-layer="197" from-port="2" to-layer="200" to-port="0" />
<edge from-layer="198" from-port="0" to-layer="199" to-port="0" />
<edge from-layer="199" from-port="1" to-layer="200" to-port="1" />
<edge from-layer="200" from-port="2" to-layer="241" to-port="0" />
<edge from-layer="200" from-port="2" to-layer="223" to-port="0" />
<edge from-layer="200" from-port="2" to-layer="203" to-port="0" />
<edge from-layer="200" from-port="2" to-layer="213" to-port="0" />
<edge from-layer="201" from-port="0" to-layer="202" to-port="0" />
<edge from-layer="202" from-port="1" to-layer="203" to-port="1" />
<edge from-layer="203" from-port="2" to-layer="206" to-port="0" />
<edge from-layer="204" from-port="0" to-layer="205" to-port="0" />
<edge from-layer="205" from-port="1" to-layer="206" to-port="1" />
<edge from-layer="206" from-port="2" to-layer="208" to-port="0" />
<edge from-layer="207" from-port="0" to-layer="208" to-port="1" />
<edge from-layer="208" from-port="2" to-layer="210" to-port="0" />
<edge from-layer="209" from-port="0" to-layer="210" to-port="1" />
<edge from-layer="210" from-port="2" to-layer="231" to-port="0" />
<edge from-layer="211" from-port="0" to-layer="212" to-port="0" />
<edge from-layer="212" from-port="1" to-layer="213" to-port="1" />
<edge from-layer="213" from-port="2" to-layer="216" to-port="0" />
<edge from-layer="214" from-port="0" to-layer="215" to-port="0" />
<edge from-layer="215" from-port="1" to-layer="216" to-port="1" />
<edge from-layer="216" from-port="2" to-layer="218" to-port="0" />
<edge from-layer="217" from-port="0" to-layer="218" to-port="1" />
<edge from-layer="218" from-port="2" to-layer="220" to-port="0" />
<edge from-layer="219" from-port="0" to-layer="220" to-port="1" />
<edge from-layer="220" from-port="2" to-layer="231" to-port="1" />
<edge from-layer="221" from-port="0" to-layer="222" to-port="0" />
<edge from-layer="222" from-port="1" to-layer="223" to-port="1" />
<edge from-layer="223" from-port="2" to-layer="226" to-port="0" />
<edge from-layer="224" from-port="0" to-layer="225" to-port="0" />
<edge from-layer="225" from-port="1" to-layer="226" to-port="1" />
<edge from-layer="226" from-port="2" to-layer="228" to-port="0" />
<edge from-layer="227" from-port="0" to-layer="228" to-port="1" />
<edge from-layer="228" from-port="2" to-layer="230" to-port="0" />
<edge from-layer="229" from-port="0" to-layer="230" to-port="1" />
<edge from-layer="230" from-port="2" to-layer="231" to-port="2" />
<edge from-layer="231" from-port="4" to-layer="233" to-port="0" />
<edge from-layer="232" from-port="0" to-layer="233" to-port="1" />
<edge from-layer="233" from-port="2" to-layer="234" to-port="0" />
<edge from-layer="234" from-port="2" to-layer="237" to-port="0" />
<edge from-layer="235" from-port="0" to-layer="236" to-port="0" />
<edge from-layer="236" from-port="1" to-layer="237" to-port="1" />
<edge from-layer="237" from-port="2" to-layer="240" to-port="0" />
<edge from-layer="238" from-port="0" to-layer="239" to-port="0" />
<edge from-layer="239" from-port="1" to-layer="240" to-port="1" />
<edge from-layer="240" from-port="2" to-layer="241" to-port="1" />
<edge from-layer="241" from-port="2" to-layer="243" to-port="0" />
<edge from-layer="242" from-port="0" to-layer="243" to-port="1" />
<edge from-layer="243" from-port="2" to-layer="246" to-port="0" />
<edge from-layer="244" from-port="0" to-layer="245" to-port="0" />
<edge from-layer="245" from-port="1" to-layer="246" to-port="1" />
<edge from-layer="246" from-port="2" to-layer="249" to-port="0" />
<edge from-layer="247" from-port="0" to-layer="248" to-port="0" />
<edge from-layer="248" from-port="1" to-layer="249" to-port="1" />
<edge from-layer="249" from-port="2" to-layer="252" to-port="0" />
<edge from-layer="249" from-port="2" to-layer="263" to-port="0" />
<edge from-layer="250" from-port="0" to-layer="251" to-port="0" />
<edge from-layer="251" from-port="1" to-layer="252" to-port="1" />
<edge from-layer="252" from-port="2" to-layer="255" to-port="0" />
<edge from-layer="253" from-port="0" to-layer="254" to-port="0" />
<edge from-layer="254" from-port="1" to-layer="255" to-port="1" />
<edge from-layer="255" from-port="2" to-layer="256" to-port="0" />
<edge from-layer="256" from-port="1" to-layer="259" to-port="0" />
<edge from-layer="257" from-port="0" to-layer="258" to-port="0" />
<edge from-layer="258" from-port="1" to-layer="259" to-port="1" />
<edge from-layer="259" from-port="2" to-layer="262" to-port="0" />
<edge from-layer="260" from-port="0" to-layer="261" to-port="0" />
<edge from-layer="261" from-port="1" to-layer="262" to-port="1" />
<edge from-layer="262" from-port="2" to-layer="263" to-port="1" />
<edge from-layer="263" from-port="2" to-layer="265" to-port="0" />
<edge from-layer="264" from-port="0" to-layer="265" to-port="1" />
<edge from-layer="265" from-port="2" to-layer="268" to-port="0" />
<edge from-layer="266" from-port="0" to-layer="267" to-port="0" />
<edge from-layer="267" from-port="1" to-layer="268" to-port="1" />
<edge from-layer="268" from-port="2" to-layer="271" to-port="0" />
<edge from-layer="269" from-port="0" to-layer="270" to-port="0" />
<edge from-layer="270" from-port="1" to-layer="271" to-port="1" />
<edge from-layer="271" from-port="2" to-layer="294" to-port="0" />
<edge from-layer="271" from-port="2" to-layer="312" to-port="0" />
<edge from-layer="271" from-port="2" to-layer="284" to-port="0" />
<edge from-layer="271" from-port="2" to-layer="274" to-port="0" />
<edge from-layer="272" from-port="0" to-layer="273" to-port="0" />
<edge from-layer="273" from-port="1" to-layer="274" to-port="1" />
<edge from-layer="274" from-port="2" to-layer="277" to-port="0" />
<edge from-layer="275" from-port="0" to-layer="276" to-port="0" />
<edge from-layer="276" from-port="1" to-layer="277" to-port="1" />
<edge from-layer="277" from-port="2" to-layer="279" to-port="0" />
<edge from-layer="278" from-port="0" to-layer="279" to-port="1" />
<edge from-layer="279" from-port="2" to-layer="281" to-port="0" />
<edge from-layer="280" from-port="0" to-layer="281" to-port="1" />
<edge from-layer="281" from-port="2" to-layer="302" to-port="0" />
<edge from-layer="282" from-port="0" to-layer="283" to-port="0" />
<edge from-layer="283" from-port="1" to-layer="284" to-port="1" />
<edge from-layer="284" from-port="2" to-layer="287" to-port="0" />
<edge from-layer="285" from-port="0" to-layer="286" to-port="0" />
<edge from-layer="286" from-port="1" to-layer="287" to-port="1" />
<edge from-layer="287" from-port="2" to-layer="289" to-port="0" />
<edge from-layer="288" from-port="0" to-layer="289" to-port="1" />
<edge from-layer="289" from-port="2" to-layer="291" to-port="0" />
<edge from-layer="290" from-port="0" to-layer="291" to-port="1" />
<edge from-layer="291" from-port="2" to-layer="302" to-port="1" />
<edge from-layer="292" from-port="0" to-layer="293" to-port="0" />
<edge from-layer="293" from-port="1" to-layer="294" to-port="1" />
<edge from-layer="294" from-port="2" to-layer="297" to-port="0" />
<edge from-layer="295" from-port="0" to-layer="296" to-port="0" />
<edge from-layer="296" from-port="1" to-layer="297" to-port="1" />
<edge from-layer="297" from-port="2" to-layer="299" to-port="0" />
<edge from-layer="298" from-port="0" to-layer="299" to-port="1" />
<edge from-layer="299" from-port="2" to-layer="301" to-port="0" />
<edge from-layer="300" from-port="0" to-layer="301" to-port="1" />
<edge from-layer="301" from-port="2" to-layer="302" to-port="2" />
<edge from-layer="302" from-port="4" to-layer="304" to-port="0" />
<edge from-layer="303" from-port="0" to-layer="304" to-port="1" />
<edge from-layer="304" from-port="2" to-layer="305" to-port="0" />
<edge from-layer="305" from-port="2" to-layer="308" to-port="0" />
<edge from-layer="306" from-port="0" to-layer="307" to-port="0" />
<edge from-layer="307" from-port="1" to-layer="308" to-port="1" />
<edge from-layer="308" from-port="2" to-layer="311" to-port="0" />
<edge from-layer="309" from-port="0" to-layer="310" to-port="0" />
<edge from-layer="310" from-port="1" to-layer="311" to-port="1" />
<edge from-layer="311" from-port="2" to-layer="312" to-port="1" />
<edge from-layer="312" from-port="2" to-layer="314" to-port="0" />
<edge from-layer="313" from-port="0" to-layer="314" to-port="1" />
<edge from-layer="314" from-port="2" to-layer="317" to-port="0" />
<edge from-layer="315" from-port="0" to-layer="316" to-port="0" />
<edge from-layer="316" from-port="1" to-layer="317" to-port="1" />
<edge from-layer="317" from-port="2" to-layer="320" to-port="0" />
<edge from-layer="318" from-port="0" to-layer="319" to-port="0" />
<edge from-layer="319" from-port="1" to-layer="320" to-port="1" />
<edge from-layer="320" from-port="2" to-layer="334" to-port="0" />
<edge from-layer="320" from-port="2" to-layer="323" to-port="0" />
<edge from-layer="321" from-port="0" to-layer="322" to-port="0" />
<edge from-layer="322" from-port="1" to-layer="323" to-port="1" />
<edge from-layer="323" from-port="2" to-layer="326" to-port="0" />
<edge from-layer="324" from-port="0" to-layer="325" to-port="0" />
<edge from-layer="325" from-port="1" to-layer="326" to-port="1" />
<edge from-layer="326" from-port="2" to-layer="327" to-port="0" />
<edge from-layer="327" from-port="1" to-layer="330" to-port="0" />
<edge from-layer="328" from-port="0" to-layer="329" to-port="0" />
<edge from-layer="329" from-port="1" to-layer="330" to-port="1" />
<edge from-layer="330" from-port="2" to-layer="333" to-port="0" />
<edge from-layer="331" from-port="0" to-layer="332" to-port="0" />
<edge from-layer="332" from-port="1" to-layer="333" to-port="1" />
<edge from-layer="333" from-port="2" to-layer="334" to-port="1" />
<edge from-layer="334" from-port="2" to-layer="336" to-port="0" />
<edge from-layer="335" from-port="0" to-layer="336" to-port="1" />
<edge from-layer="336" from-port="2" to-layer="339" to-port="0" />
<edge from-layer="337" from-port="0" to-layer="338" to-port="0" />
<edge from-layer="338" from-port="1" to-layer="339" to-port="1" />
<edge from-layer="339" from-port="2" to-layer="342" to-port="0" />
<edge from-layer="340" from-port="0" to-layer="341" to-port="0" />
<edge from-layer="341" from-port="1" to-layer="342" to-port="1" />
<edge from-layer="342" from-port="2" to-layer="345" to-port="0" />
<edge from-layer="342" from-port="2" to-layer="383" to-port="0" />
<edge from-layer="342" from-port="2" to-layer="365" to-port="0" />
<edge from-layer="342" from-port="2" to-layer="355" to-port="0" />
<edge from-layer="343" from-port="0" to-layer="344" to-port="0" />
<edge from-layer="344" from-port="1" to-layer="345" to-port="1" />
<edge from-layer="345" from-port="2" to-layer="348" to-port="0" />
<edge from-layer="346" from-port="0" to-layer="347" to-port="0" />
<edge from-layer="347" from-port="1" to-layer="348" to-port="1" />
<edge from-layer="348" from-port="2" to-layer="350" to-port="0" />
<edge from-layer="349" from-port="0" to-layer="350" to-port="1" />
<edge from-layer="350" from-port="2" to-layer="352" to-port="0" />
<edge from-layer="351" from-port="0" to-layer="352" to-port="1" />
<edge from-layer="352" from-port="2" to-layer="373" to-port="0" />
<edge from-layer="353" from-port="0" to-layer="354" to-port="0" />
<edge from-layer="354" from-port="1" to-layer="355" to-port="1" />
<edge from-layer="355" from-port="2" to-layer="358" to-port="0" />
<edge from-layer="356" from-port="0" to-layer="357" to-port="0" />
<edge from-layer="357" from-port="1" to-layer="358" to-port="1" />
<edge from-layer="358" from-port="2" to-layer="360" to-port="0" />
<edge from-layer="359" from-port="0" to-layer="360" to-port="1" />
<edge from-layer="360" from-port="2" to-layer="362" to-port="0" />
<edge from-layer="361" from-port="0" to-layer="362" to-port="1" />
<edge from-layer="362" from-port="2" to-layer="373" to-port="1" />
<edge from-layer="363" from-port="0" to-layer="364" to-port="0" />
<edge from-layer="364" from-port="1" to-layer="365" to-port="1" />
<edge from-layer="365" from-port="2" to-layer="368" to-port="0" />
<edge from-layer="366" from-port="0" to-layer="367" to-port="0" />
<edge from-layer="367" from-port="1" to-layer="368" to-port="1" />
<edge from-layer="368" from-port="2" to-layer="370" to-port="0" />
<edge from-layer="369" from-port="0" to-layer="370" to-port="1" />
<edge from-layer="370" from-port="2" to-layer="372" to-port="0" />
<edge from-layer="371" from-port="0" to-layer="372" to-port="1" />
<edge from-layer="372" from-port="2" to-layer="373" to-port="2" />
<edge from-layer="373" from-port="4" to-layer="375" to-port="0" />
<edge from-layer="374" from-port="0" to-layer="375" to-port="1" />
<edge from-layer="375" from-port="2" to-layer="376" to-port="0" />
<edge from-layer="376" from-port="2" to-layer="379" to-port="0" />
<edge from-layer="377" from-port="0" to-layer="378" to-port="0" />
<edge from-layer="378" from-port="1" to-layer="379" to-port="1" />
<edge from-layer="379" from-port="2" to-layer="382" to-port="0" />
<edge from-layer="380" from-port="0" to-layer="381" to-port="0" />
<edge from-layer="381" from-port="1" to-layer="382" to-port="1" />
<edge from-layer="382" from-port="2" to-layer="383" to-port="1" />
<edge from-layer="383" from-port="2" to-layer="385" to-port="0" />
<edge from-layer="384" from-port="0" to-layer="385" to-port="1" />
<edge from-layer="385" from-port="2" to-layer="388" to-port="0" />
<edge from-layer="386" from-port="0" to-layer="387" to-port="0" />
<edge from-layer="387" from-port="1" to-layer="388" to-port="1" />
<edge from-layer="388" from-port="2" to-layer="391" to-port="0" />
<edge from-layer="389" from-port="0" to-layer="390" to-port="0" />
<edge from-layer="390" from-port="1" to-layer="391" to-port="1" />
<edge from-layer="391" from-port="2" to-layer="405" to-port="0" />
<edge from-layer="391" from-port="2" to-layer="394" to-port="0" />
<edge from-layer="392" from-port="0" to-layer="393" to-port="0" />
<edge from-layer="393" from-port="1" to-layer="394" to-port="1" />
<edge from-layer="394" from-port="2" to-layer="397" to-port="0" />
<edge from-layer="395" from-port="0" to-layer="396" to-port="0" />
<edge from-layer="396" from-port="1" to-layer="397" to-port="1" />
<edge from-layer="397" from-port="2" to-layer="398" to-port="0" />
<edge from-layer="398" from-port="1" to-layer="401" to-port="0" />
<edge from-layer="399" from-port="0" to-layer="400" to-port="0" />
<edge from-layer="400" from-port="1" to-layer="401" to-port="1" />
<edge from-layer="401" from-port="2" to-layer="404" to-port="0" />
<edge from-layer="402" from-port="0" to-layer="403" to-port="0" />
<edge from-layer="403" from-port="1" to-layer="404" to-port="1" />
<edge from-layer="404" from-port="2" to-layer="405" to-port="1" />
<edge from-layer="405" from-port="2" to-layer="407" to-port="0" />
<edge from-layer="406" from-port="0" to-layer="407" to-port="1" />
<edge from-layer="407" from-port="2" to-layer="410" to-port="0" />
<edge from-layer="408" from-port="0" to-layer="409" to-port="0" />
<edge from-layer="409" from-port="1" to-layer="410" to-port="1" />
<edge from-layer="410" from-port="2" to-layer="413" to-port="0" />
<edge from-layer="411" from-port="0" to-layer="412" to-port="0" />
<edge from-layer="412" from-port="1" to-layer="413" to-port="1" />
<edge from-layer="413" from-port="2" to-layer="416" to-port="0" />
<edge from-layer="413" from-port="2" to-layer="454" to-port="0" />
<edge from-layer="413" from-port="2" to-layer="436" to-port="0" />
<edge from-layer="413" from-port="2" to-layer="426" to-port="0" />
<edge from-layer="414" from-port="0" to-layer="415" to-port="0" />
<edge from-layer="415" from-port="1" to-layer="416" to-port="1" />
<edge from-layer="416" from-port="2" to-layer="419" to-port="0" />
<edge from-layer="417" from-port="0" to-layer="418" to-port="0" />
<edge from-layer="418" from-port="1" to-layer="419" to-port="1" />
<edge from-layer="419" from-port="2" to-layer="421" to-port="0" />
<edge from-layer="420" from-port="0" to-layer="421" to-port="1" />
<edge from-layer="421" from-port="2" to-layer="423" to-port="0" />
<edge from-layer="422" from-port="0" to-layer="423" to-port="1" />
<edge from-layer="423" from-port="2" to-layer="444" to-port="0" />
<edge from-layer="424" from-port="0" to-layer="425" to-port="0" />
<edge from-layer="425" from-port="1" to-layer="426" to-port="1" />
<edge from-layer="426" from-port="2" to-layer="429" to-port="0" />
<edge from-layer="427" from-port="0" to-layer="428" to-port="0" />
<edge from-layer="428" from-port="1" to-layer="429" to-port="1" />
<edge from-layer="429" from-port="2" to-layer="431" to-port="0" />
<edge from-layer="430" from-port="0" to-layer="431" to-port="1" />
<edge from-layer="431" from-port="2" to-layer="433" to-port="0" />
<edge from-layer="432" from-port="0" to-layer="433" to-port="1" />
<edge from-layer="433" from-port="2" to-layer="444" to-port="1" />
<edge from-layer="434" from-port="0" to-layer="435" to-port="0" />
<edge from-layer="435" from-port="1" to-layer="436" to-port="1" />
<edge from-layer="436" from-port="2" to-layer="439" to-port="0" />
<edge from-layer="437" from-port="0" to-layer="438" to-port="0" />
<edge from-layer="438" from-port="1" to-layer="439" to-port="1" />
<edge from-layer="439" from-port="2" to-layer="441" to-port="0" />
<edge from-layer="440" from-port="0" to-layer="441" to-port="1" />
<edge from-layer="441" from-port="2" to-layer="443" to-port="0" />
<edge from-layer="442" from-port="0" to-layer="443" to-port="1" />
<edge from-layer="443" from-port="2" to-layer="444" to-port="2" />
<edge from-layer="444" from-port="4" to-layer="446" to-port="0" />
<edge from-layer="445" from-port="0" to-layer="446" to-port="1" />
<edge from-layer="446" from-port="2" to-layer="447" to-port="0" />
<edge from-layer="447" from-port="2" to-layer="450" to-port="0" />
<edge from-layer="448" from-port="0" to-layer="449" to-port="0" />
<edge from-layer="449" from-port="1" to-layer="450" to-port="1" />
<edge from-layer="450" from-port="2" to-layer="453" to-port="0" />
<edge from-layer="451" from-port="0" to-layer="452" to-port="0" />
<edge from-layer="452" from-port="1" to-layer="453" to-port="1" />
<edge from-layer="453" from-port="2" to-layer="454" to-port="1" />
<edge from-layer="454" from-port="2" to-layer="456" to-port="0" />
<edge from-layer="455" from-port="0" to-layer="456" to-port="1" />
<edge from-layer="456" from-port="2" to-layer="459" to-port="0" />
<edge from-layer="457" from-port="0" to-layer="458" to-port="0" />
<edge from-layer="458" from-port="1" to-layer="459" to-port="1" />
<edge from-layer="459" from-port="2" to-layer="462" to-port="0" />
<edge from-layer="460" from-port="0" to-layer="461" to-port="0" />
<edge from-layer="461" from-port="1" to-layer="462" to-port="1" />
<edge from-layer="462" from-port="2" to-layer="465" to-port="0" />
<edge from-layer="462" from-port="2" to-layer="476" to-port="0" />
<edge from-layer="463" from-port="0" to-layer="464" to-port="0" />
<edge from-layer="464" from-port="1" to-layer="465" to-port="1" />
<edge from-layer="465" from-port="2" to-layer="468" to-port="0" />
<edge from-layer="466" from-port="0" to-layer="467" to-port="0" />
<edge from-layer="467" from-port="1" to-layer="468" to-port="1" />
<edge from-layer="468" from-port="2" to-layer="469" to-port="0" />
<edge from-layer="469" from-port="1" to-layer="472" to-port="0" />
<edge from-layer="470" from-port="0" to-layer="471" to-port="0" />
<edge from-layer="471" from-port="1" to-layer="472" to-port="1" />
<edge from-layer="472" from-port="2" to-layer="475" to-port="0" />
<edge from-layer="473" from-port="0" to-layer="474" to-port="0" />
<edge from-layer="474" from-port="1" to-layer="475" to-port="1" />
<edge from-layer="475" from-port="2" to-layer="476" to-port="1" />
<edge from-layer="476" from-port="2" to-layer="478" to-port="0" />
<edge from-layer="477" from-port="0" to-layer="478" to-port="1" />
<edge from-layer="478" from-port="2" to-layer="481" to-port="0" />
<edge from-layer="479" from-port="0" to-layer="480" to-port="0" />
<edge from-layer="480" from-port="1" to-layer="481" to-port="1" />
<edge from-layer="481" from-port="2" to-layer="484" to-port="0" />
<edge from-layer="482" from-port="0" to-layer="483" to-port="0" />
<edge from-layer="483" from-port="1" to-layer="484" to-port="1" />
<edge from-layer="484" from-port="2" to-layer="485" to-port="0" />
</edges>
<rt_info>
<Runtime_version value="2025.3.0-19807-44526285f24-releases/2025/3" />
<conversion_parameters>
<framework value="pytorch" />
<is_python_object value="True" />
</conversion_parameters>
</rt_info>
</net>