stsb-TinyBERT-L4 / openvino /openvino_model_qint8_quantized.xml
tomaarsen's picture
tomaarsen HF Staff
Add exported openvino model 'openvino_model_qint8_quantized.xml'
1f47848 verified
<?xml version="1.0"?>
<net name="Model0" version="11">
<layers>
<layer id="2" name="input_ids" type="Parameter" version="opset1">
<data shape="?,?" element_type="i64" />
<output>
<port id="0" precision="I64" names="input_ids">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="1" name="attention_mask" type="Parameter" version="opset1">
<data shape="?,?" element_type="i64" />
<output>
<port id="0" precision="I64" names="attention_mask">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="0" name="token_type_ids" type="Parameter" version="opset1">
<data shape="?,?" element_type="i64" />
<output>
<port id="0" precision="I64" names="token_type_ids">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="3" name="Constant_149220" type="Const" version="opset1">
<data element_type="i8" shape="30522, 312" offset="0" size="9522864" />
<output>
<port id="0" precision="I8">
<dim>30522</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="4" name="Convert_149221" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>30522</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>30522</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="5" name="Constant_149222" type="Const" version="opset1">
<data element_type="f32" shape="30522, 1" offset="9522864" size="122088" />
<output>
<port id="0" precision="FP32">
<dim>30522</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="6" name="__module.bert.embeddings.word_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>30522</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>30522</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>30522</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="7" name="__module.bert.embeddings.word_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
<data destination_type="i32" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="8" name="__module.bert.embeddings.word_embeddings/aten::embedding/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="9644952" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="9" name="__module.bert.embeddings.word_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="FP32">
<dim>30522</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="FP32" names="48,inputs_embeds">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="10" name="Constant_149224" type="Const" version="opset1">
<data element_type="i8" shape="2, 312" offset="9644956" size="624" />
<output>
<port id="0" precision="I8">
<dim>2</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="11" name="Convert_149225" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>2</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>2</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="12" name="Constant_149226" type="Const" version="opset1">
<data element_type="f32" shape="2, 1" offset="9645580" size="8" />
<output>
<port id="0" precision="FP32">
<dim>2</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="13" name="__module.bert.embeddings.token_type_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>2</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>2</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>2</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="14" name="__module.bert.embeddings.token_type_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
<data destination_type="i32" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="15" name="__module.bert.embeddings.token_type_embeddings/aten::embedding/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="9644952" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="16" name="__module.bert.embeddings.token_type_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="FP32">
<dim>2</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="FP32" names="50,token_type_embeddings.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="17" name="__module.bert.embeddings/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="51_1">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="18" name="Constant_149228" type="Const" version="opset1">
<data element_type="i8" shape="512, 312" offset="9645588" size="159744" />
<output>
<port id="0" precision="I8">
<dim>512</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="19" name="Convert_149229" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>512</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="20" name="Constant_149230" type="Const" version="opset1">
<data element_type="f32" shape="512, 1" offset="9805332" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>512</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="21" name="__module.bert.embeddings.position_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>512</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>512</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="22" name="__module.bert.embeddings/aten::slice/Slice" type="Const" version="opset1">
<data element_type="i64" shape="1, 512" offset="9807380" size="4096" />
<output>
<port id="0" precision="I64" names="45">
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="23" name="__module.bert.embeddings/aten::slice/Reshape" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="9811476" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="24" name="ShapeOf_5105" type="ShapeOf" version="opset3">
<data output_type="i64" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="25" name="Constant_5222" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="9811484" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="26" name="Constant_5107" type="Const" version="opset1">
<data element_type="i64" shape="" offset="9811476" size="8" />
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="27" name="Gather_5108" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I64">
<dim>2</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I64" names="35,41,43,44,61">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="28" name="__module.bert.embeddings/aten::slice/Reshape_2" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="9811484" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="29" name="__module.bert.embeddings/aten::slice/Reshape_3" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="9811484" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="30" name="__module.bert.embeddings/aten::slice/Slice_1" type="Slice" version="opset8">
<input>
<port id="0" precision="I64">
<dim>1</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64">
<dim>1</dim>
</port>
<port id="3" precision="I64">
<dim>1</dim>
</port>
<port id="4" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="5" precision="I64" names="46">
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="31" name="__module.bert.embeddings.position_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
<data destination_type="i32" />
<input>
<port id="0" precision="I64">
<dim>1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I32">
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="32" name="__module.bert.embeddings.position_embeddings/aten::embedding/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="9644952" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="33" name="__module.bert.embeddings.position_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="FP32">
<dim>512</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
<dim>-1</dim>
</port>
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="FP32" names="53,position_embeddings.1">
<dim>1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="34" name="__module.bert.embeddings/aten::add_/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="51,embeddings.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="35" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="9811492" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="36" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="37" name="Constant_5012" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="9811496" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="38" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="39" name="Constant_5013" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="9812744" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="40" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="58,input.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="41" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="9813992" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="42" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="43" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="9815240" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="44" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="9815244" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="45" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="9815240" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="46" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="9815244" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="47" name="__module.bert.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="48" name="Constant_149232" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="9815248" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="49" name="Convert_149233" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="50" name="Constant_149234" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="9912592" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="51" name="__module.bert.encoder.layer.0.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="52" name="__module.bert.encoder.layer.0.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="53" name="Constant_5014" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="9913840" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="54" name="__module.bert.encoder.layer.0.attention.self.query/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="92,x.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="55" name="__module.bert.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="9915088" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="56" name="__module.bert.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="9915092" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="57" name="__module.bert.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="9915088" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="58" name="__module.bert.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="9915092" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="59" name="__module.bert.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="60" name="__module.bert.encoder.layer.0.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="61" name="__module.bert.encoder.layer.0.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="96,x.3">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="62" name="Constant_201" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="97">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="63" name="__module.bert.encoder.layer.0.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="98">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="64" name="Constant_149236" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="9915160" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="65" name="Convert_149237" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="66" name="Constant_149238" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="10012504" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="67" name="__module.bert.encoder.layer.0.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="68" name="__module.bert.encoder.layer.0.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="69" name="Constant_5015" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10013752" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="70" name="__module.bert.encoder.layer.0.attention.self.key/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="101,x.5">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="71" name="__module.bert.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10015000" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="72" name="__module.bert.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10015004" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="73" name="__module.bert.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10015000" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="74" name="__module.bert.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10015004" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="75" name="__module.bert.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="76" name="__module.bert.encoder.layer.0.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="77" name="__module.bert.encoder.layer.0.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="105,x.7">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="78" name="Constant_226" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="106">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="79" name="__module.bert.encoder.layer.0.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="107">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="80" name="Constant_149240" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="10015008" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="81" name="Convert_149241" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="82" name="Constant_149242" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="10112352" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="83" name="__module.bert.encoder.layer.0.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="84" name="__module.bert.encoder.layer.0.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="85" name="Constant_5016" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10113600" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="86" name="__module.bert.encoder.layer.0.attention.self.value/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="110,x.9">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="87" name="__module.bert.encoder.layer.0.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="88" name="__module.bert.encoder.layer.0.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="114,x.11">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="89" name="Constant_251" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="115">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="90" name="__module.bert.encoder.layer.0.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="116">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="91" name="Constant_5018" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1, 1" offset="10114848" size="4" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="92" name="31" type="Const" version="opset1">
<data element_type="i64" shape="" offset="9811484" size="8" />
<output>
<port id="0" precision="I64" names="31" />
</output>
</layer>
<layer id="93" name="__module.bert/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64" />
</input>
<output>
<port id="2" precision="I64" names="63">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="94" name="21" type="Const" version="opset1">
<data element_type="i64" shape="" offset="10114852" size="8" />
<output>
<port id="0" precision="I64" names="21" />
</output>
</layer>
<layer id="95" name="__module.bert/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1">
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64" />
</input>
<output>
<port id="2" precision="I64" names="64,65">
<dim>-1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="96" name="Constant_5114" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="9811476" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="97" name="Constant_5115" type="Const" version="opset1">
<data element_type="i64" shape="" offset="9811476" size="8" />
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="98" name="Gather_5116" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I64">
<dim>2</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I64" names="60">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="99" name="Constant_4446" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="9811484" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="100" name="Constant_5224" type="Const" version="opset1">
<data element_type="i64" shape="2" offset="10114860" size="16" />
<output>
<port id="0" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="101" name="Constant_5225" type="Const" version="opset1">
<data element_type="i64" shape="" offset="9811476" size="8" />
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="102" name="Gather_5226" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I64">
<dim>2</dim>
</port>
<port id="1" precision="I64">
<dim>2</dim>
</port>
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="103" name="__module.bert/prim::ListConstruct/Concat" type="Concat" version="opset1">
<data axis="0" />
<input>
<port id="0" precision="I64">
<dim>1</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64">
<dim>2</dim>
</port>
</input>
<output>
<port id="3" precision="I64" names="66">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="104" name="__module.bert/aten::expand/Broadcast" type="Broadcast" version="opset3">
<data mode="bidirectional" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="I64" names="67">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="105" name="__module.bert/aten::to/Convert" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="68">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="106" name="Constant_5017" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1, 1" offset="10114848" size="4" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="107" name="__module.bert/aten::rsub/Multiply" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="108" name="__module.bert/aten::rsub/Subtract" type="Subtract" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
<dim>1</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="69,inverted_mask">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="109" name="__module.bert/aten::to/Convert_1" type="Convert" version="opset1">
<data destination_type="boolean" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="BOOL" names="70">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="110" name="__module.bert/aten::masked_fill/ConvertLike" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10114876" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="111" name="__module.bert/aten::masked_fill/Select" type="Select" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="BOOL">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="3" precision="FP32" names="71">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="112" name="__module.bert.encoder.layer.0.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="117,attn_output.1">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="113" name="__module.bert.encoder.layer.0.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="10114880" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="114" name="__module.bert.encoder.layer.0.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="118,attn_output.3">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="115" name="Constant_5121" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="10114896" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="116" name="__module.bert.encoder.layer.0.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="120">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="117" name="__module.bert.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10114920" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="118" name="__module.bert.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="119" name="__module.bert.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10116168" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="120" name="__module.bert.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10116172" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="121" name="__module.bert.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10116168" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="122" name="__module.bert.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10116172" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="123" name="__module.bert.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="124" name="Constant_149244" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="10116176" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="125" name="Convert_149245" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="126" name="Constant_149246" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="10213520" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="127" name="__module.bert.encoder.layer.0.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="128" name="__module.bert.encoder.layer.0.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="129" name="Constant_5019" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10214768" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="130" name="__module.bert.encoder.layer.0.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="125,input.3">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="131" name="__module.bert.encoder.layer.0.attention.output/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="127">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="132" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="9811492" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="133" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="134" name="Constant_5020" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10216016" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="135" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="136" name="Constant_5021" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10217264" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="137" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="131,input_tensor.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="138" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10218512" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="139" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="140" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10219760" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="141" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10219764" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="142" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10219760" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="143" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10219764" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="144" name="__module.bert.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="145" name="Constant_149248" type="Const" version="opset1">
<data element_type="i8" shape="1200, 312" offset="10219768" size="374400" />
<output>
<port id="0" precision="I8">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="146" name="Convert_149249" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>1200</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="147" name="Constant_149250" type="Const" version="opset1">
<data element_type="f32" shape="1200, 1" offset="10594168" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1200</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="148" name="__module.bert.encoder.layer.0.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="149" name="__module.bert.encoder.layer.0.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="150" name="Constant_5022" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1200" offset="10598968" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="151" name="__module.bert.encoder.layer.0.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="135">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="152" name="__module.bert.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="136">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="153" name="__module.bert.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1200" offset="10603768" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="154" name="__module.bert.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="155" name="__module.bert.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10608568" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="156" name="__module.bert.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10608572" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="157" name="__module.bert.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10608568" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="158" name="__module.bert.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10608572" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="159" name="__module.bert.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="160" name="Constant_149252" type="Const" version="opset1">
<data element_type="i8" shape="312, 1200" offset="10608576" size="374400" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="161" name="Convert_149253" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="162" name="Constant_149254" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="10982976" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="163" name="__module.bert.encoder.layer.0.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="164" name="__module.bert.encoder.layer.0.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="165" name="Constant_5023" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10984224" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="166" name="__module.bert.encoder.layer.0.output.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="141,input.5">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="167" name="__module.bert.encoder.layer.0.output/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="143">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="168" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="9811492" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="169" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="170" name="Constant_5024" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10985472" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="171" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="172" name="Constant_5025" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10986720" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="173" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="147,hidden_states.7">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="174" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="10987968" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="175" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="176" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10989216" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="177" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10989220" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="178" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10989216" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="179" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="10989220" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="180" name="__module.bert.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="181" name="Constant_149256" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="10989224" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="182" name="Convert_149257" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="183" name="Constant_149258" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="11086568" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="184" name="__module.bert.encoder.layer.1.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="185" name="__module.bert.encoder.layer.1.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="186" name="Constant_5026" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="11087816" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="187" name="__module.bert.encoder.layer.1.attention.self.query/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="160,x.13">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="188" name="__module.bert.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11089064" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="189" name="__module.bert.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11089068" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="190" name="__module.bert.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11089064" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="191" name="__module.bert.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11089068" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="192" name="__module.bert.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="193" name="__module.bert.encoder.layer.1.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="194" name="__module.bert.encoder.layer.1.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="164,x.15">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="195" name="Constant_430" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="165">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="196" name="__module.bert.encoder.layer.1.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="166">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="197" name="Constant_149260" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="11089072" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="198" name="Convert_149261" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="199" name="Constant_149262" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="11186416" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="200" name="__module.bert.encoder.layer.1.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="201" name="__module.bert.encoder.layer.1.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="202" name="Constant_5027" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="11187664" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="203" name="__module.bert.encoder.layer.1.attention.self.key/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="169,x.17">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="204" name="__module.bert.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11188912" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="205" name="__module.bert.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11188916" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="206" name="__module.bert.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11188912" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="207" name="__module.bert.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11188916" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="208" name="__module.bert.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="209" name="__module.bert.encoder.layer.1.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="210" name="__module.bert.encoder.layer.1.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="173,x.19">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="211" name="Constant_453" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="174">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="212" name="__module.bert.encoder.layer.1.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="175">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="213" name="Constant_149264" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="11188920" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="214" name="Convert_149265" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="215" name="Constant_149266" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="11286264" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="216" name="__module.bert.encoder.layer.1.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="217" name="__module.bert.encoder.layer.1.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="218" name="Constant_5028" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="11287512" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="219" name="__module.bert.encoder.layer.1.attention.self.value/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="178,x.21">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="220" name="__module.bert.encoder.layer.1.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="221" name="__module.bert.encoder.layer.1.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="182,x.23">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="222" name="Constant_476" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="183">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="223" name="__module.bert.encoder.layer.1.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="184">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="224" name="__module.bert.encoder.layer.1.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="185,attn_output.5">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="225" name="__module.bert.encoder.layer.1.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="10114880" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="226" name="__module.bert.encoder.layer.1.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="186,attn_output.7">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="227" name="Constant_5122" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="10114896" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="228" name="__module.bert.encoder.layer.1.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="188">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="229" name="__module.bert.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="11288760" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="230" name="__module.bert.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="231" name="__module.bert.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11290008" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="232" name="__module.bert.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11290012" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="233" name="__module.bert.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11290008" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="234" name="__module.bert.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11290012" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="235" name="__module.bert.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="236" name="Constant_149268" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="11290016" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="237" name="Convert_149269" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="238" name="Constant_149270" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="11387360" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="239" name="__module.bert.encoder.layer.1.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="240" name="__module.bert.encoder.layer.1.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="241" name="Constant_5029" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="11388608" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="242" name="__module.bert.encoder.layer.1.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="193,input.7">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="243" name="__module.bert.encoder.layer.1.attention.output/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="195">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="244" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="9811492" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="245" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="246" name="Constant_5030" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="11389856" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="247" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="248" name="Constant_5031" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="11391104" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="249" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="199,input_tensor.3">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="250" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="11392352" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="251" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="252" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11393600" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="253" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11393604" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="254" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11393600" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="255" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11393604" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="256" name="__module.bert.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="257" name="Constant_149272" type="Const" version="opset1">
<data element_type="i8" shape="1200, 312" offset="11393608" size="374400" />
<output>
<port id="0" precision="I8">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="258" name="Convert_149273" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>1200</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="259" name="Constant_149274" type="Const" version="opset1">
<data element_type="f32" shape="1200, 1" offset="11768008" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1200</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="260" name="__module.bert.encoder.layer.1.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="261" name="__module.bert.encoder.layer.1.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="262" name="Constant_5032" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1200" offset="11772808" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="263" name="__module.bert.encoder.layer.1.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="203">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="264" name="__module.bert.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="204">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="265" name="__module.bert.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1200" offset="11777608" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="266" name="__module.bert.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="267" name="__module.bert.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11782408" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="268" name="__module.bert.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11782412" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="269" name="__module.bert.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11782408" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="270" name="__module.bert.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="11782412" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="271" name="__module.bert.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="272" name="Constant_149276" type="Const" version="opset1">
<data element_type="i8" shape="312, 1200" offset="11782416" size="374400" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="273" name="Convert_149277" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="274" name="Constant_149278" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="12156816" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="275" name="__module.bert.encoder.layer.1.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="276" name="__module.bert.encoder.layer.1.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="277" name="Constant_5033" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12158064" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="278" name="__module.bert.encoder.layer.1.output.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="209,input.9">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="279" name="__module.bert.encoder.layer.1.output/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="211">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="280" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="9811492" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="281" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="282" name="Constant_5034" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12159312" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="283" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="284" name="Constant_5035" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12160560" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="285" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="215,hidden_states.13">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="286" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12161808" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="287" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="288" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12163056" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="289" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12163060" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="290" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12163056" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="291" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12163060" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="292" name="__module.bert.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="293" name="Constant_149280" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="12163064" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="294" name="Convert_149281" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="295" name="Constant_149282" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="12260408" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="296" name="__module.bert.encoder.layer.2.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="297" name="__module.bert.encoder.layer.2.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="298" name="Constant_5036" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12261656" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="299" name="__module.bert.encoder.layer.2.attention.self.query/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="228,x.25">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="300" name="__module.bert.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12262904" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="301" name="__module.bert.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12262908" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="302" name="__module.bert.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12262904" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="303" name="__module.bert.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12262908" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="304" name="__module.bert.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="305" name="__module.bert.encoder.layer.2.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="306" name="__module.bert.encoder.layer.2.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="232,x.27">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="307" name="Constant_653" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="233">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="308" name="__module.bert.encoder.layer.2.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="234">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="309" name="Constant_149284" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="12262912" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="310" name="Convert_149285" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="311" name="Constant_149286" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="12360256" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="312" name="__module.bert.encoder.layer.2.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="313" name="__module.bert.encoder.layer.2.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="314" name="Constant_5037" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12361504" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="315" name="__module.bert.encoder.layer.2.attention.self.key/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="237,x.29">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="316" name="__module.bert.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12362752" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="317" name="__module.bert.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12362756" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="318" name="__module.bert.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12362752" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="319" name="__module.bert.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12362756" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="320" name="__module.bert.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="321" name="__module.bert.encoder.layer.2.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="322" name="__module.bert.encoder.layer.2.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="241,x.31">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="323" name="Constant_676" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="242">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="324" name="__module.bert.encoder.layer.2.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="243">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="325" name="Constant_149288" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="12362760" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="326" name="Convert_149289" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="327" name="Constant_149290" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="12460104" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="328" name="__module.bert.encoder.layer.2.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="329" name="__module.bert.encoder.layer.2.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="330" name="Constant_5038" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12461352" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="331" name="__module.bert.encoder.layer.2.attention.self.value/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="246,x.33">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="332" name="__module.bert.encoder.layer.2.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="333" name="__module.bert.encoder.layer.2.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="250,x.35">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="334" name="Constant_699" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="251">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="335" name="__module.bert.encoder.layer.2.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="252">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="336" name="__module.bert.encoder.layer.2.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="253,attn_output.9">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="337" name="__module.bert.encoder.layer.2.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="10114880" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="338" name="__module.bert.encoder.layer.2.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="254,attn_output.11">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="339" name="Constant_5123" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="10114896" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="340" name="__module.bert.encoder.layer.2.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="256">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="341" name="__module.bert.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12462600" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="342" name="__module.bert.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="343" name="__module.bert.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12463848" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="344" name="__module.bert.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12463852" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="345" name="__module.bert.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12463848" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="346" name="__module.bert.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12463852" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="347" name="__module.bert.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="348" name="Constant_149292" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="12463856" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="349" name="Convert_149293" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="350" name="Constant_149294" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="12561200" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="351" name="__module.bert.encoder.layer.2.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="352" name="__module.bert.encoder.layer.2.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="353" name="Constant_5039" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12562448" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="354" name="__module.bert.encoder.layer.2.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="261,input.11">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="355" name="__module.bert.encoder.layer.2.attention.output/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="263">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="356" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="9811492" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="357" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="358" name="Constant_5040" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12563696" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="359" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="360" name="Constant_5041" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12564944" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="361" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="267,input_tensor.5">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="362" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="12566192" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="363" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="364" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12567440" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="365" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12567444" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="366" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12567440" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="367" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12567444" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="368" name="__module.bert.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="369" name="Constant_149296" type="Const" version="opset1">
<data element_type="i8" shape="1200, 312" offset="12567448" size="374400" />
<output>
<port id="0" precision="I8">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="370" name="Convert_149297" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>1200</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="371" name="Constant_149298" type="Const" version="opset1">
<data element_type="f32" shape="1200, 1" offset="12941848" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1200</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="372" name="__module.bert.encoder.layer.2.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="373" name="__module.bert.encoder.layer.2.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="374" name="Constant_5042" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1200" offset="12946648" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="375" name="__module.bert.encoder.layer.2.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="271">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="376" name="__module.bert.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="272">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="377" name="__module.bert.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1200" offset="12951448" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="378" name="__module.bert.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="379" name="__module.bert.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12956248" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="380" name="__module.bert.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12956252" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="381" name="__module.bert.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12956248" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="382" name="__module.bert.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="12956252" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="383" name="__module.bert.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="384" name="Constant_149300" type="Const" version="opset1">
<data element_type="i8" shape="312, 1200" offset="12956256" size="374400" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="385" name="Convert_149301" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="386" name="Constant_149302" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="13330656" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="387" name="__module.bert.encoder.layer.2.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="388" name="__module.bert.encoder.layer.2.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="389" name="Constant_5043" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13331904" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="390" name="__module.bert.encoder.layer.2.output.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="277,input.13">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="391" name="__module.bert.encoder.layer.2.output/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="279">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="392" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="9811492" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="393" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="394" name="Constant_5044" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13333152" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="395" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="396" name="Constant_5045" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13334400" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="397" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="283,hidden_states.19">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="398" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13335648" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="399" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="400" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13336896" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="401" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13336900" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="402" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13336896" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="403" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13336900" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="404" name="__module.bert.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="405" name="Constant_149304" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="13336904" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="406" name="Convert_149305" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="407" name="Constant_149306" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="13434248" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="408" name="__module.bert.encoder.layer.3.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="409" name="__module.bert.encoder.layer.3.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="410" name="Constant_5046" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13435496" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="411" name="__module.bert.encoder.layer.3.attention.self.query/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="296,x.37">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="412" name="__module.bert.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13436744" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="413" name="__module.bert.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13436748" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="414" name="__module.bert.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13436744" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="415" name="__module.bert.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13436748" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="416" name="__module.bert.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="417" name="__module.bert.encoder.layer.3.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="418" name="__module.bert.encoder.layer.3.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="300,x.39">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="419" name="Constant_876" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="301">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="420" name="__module.bert.encoder.layer.3.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="302">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="421" name="Constant_149308" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="13436752" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="422" name="Convert_149309" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="423" name="Constant_149310" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="13534096" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="424" name="__module.bert.encoder.layer.3.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="425" name="__module.bert.encoder.layer.3.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="426" name="Constant_5047" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13535344" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="427" name="__module.bert.encoder.layer.3.attention.self.key/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="305,x.41">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="428" name="__module.bert.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13536592" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="429" name="__module.bert.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13536596" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="430" name="__module.bert.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13536592" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="431" name="__module.bert.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13536596" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="432" name="__module.bert.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="433" name="__module.bert.encoder.layer.3.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="434" name="__module.bert.encoder.layer.3.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="309,x.43">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="435" name="Constant_899" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="310">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="436" name="__module.bert.encoder.layer.3.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="311">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="437" name="Constant_149312" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="13536600" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="438" name="Convert_149313" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="439" name="Constant_149314" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="13633944" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="440" name="__module.bert.encoder.layer.3.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="441" name="__module.bert.encoder.layer.3.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="442" name="Constant_5048" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13635192" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="443" name="__module.bert.encoder.layer.3.attention.self.value/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="314,x.45">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="444" name="__module.bert.encoder.layer.3.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915096" size="32" />
<output>
<port id="0" precision="I64">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="445" name="__module.bert.encoder.layer.3.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="318,x">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="446" name="Constant_922" type="Const" version="opset1">
<data element_type="i64" shape="4" offset="9915128" size="32" />
<output>
<port id="0" precision="I64" names="319">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="447" name="__module.bert.encoder.layer.3.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="320">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="448" name="__module.bert.encoder.layer.3.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
<data causal="false" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="3" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="4" precision="FP32" names="321,attn_output.13">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="449" name="__module.bert.encoder.layer.3.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
<data element_type="i32" shape="4" offset="10114880" size="16" />
<output>
<port id="0" precision="I32">
<dim>4</dim>
</port>
</output>
</layer>
<layer id="450" name="__module.bert.encoder.layer.3.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>12</dim>
<dim>-1</dim>
<dim>26</dim>
</port>
<port id="1" precision="I32">
<dim>4</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="322,attn_output">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
</output>
</layer>
<layer id="451" name="Constant_5124" type="Const" version="opset1">
<data element_type="i64" shape="3" offset="10114896" size="24" />
<output>
<port id="0" precision="I64">
<dim>3</dim>
</port>
</output>
</layer>
<layer id="452" name="__module.bert.encoder.layer.3.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
<data special_zero="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>12</dim>
<dim>26</dim>
</port>
<port id="1" precision="I64">
<dim>3</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="324">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="453" name="__module.bert.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13636440" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="454" name="__module.bert.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="455" name="__module.bert.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13637688" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="456" name="__module.bert.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13637692" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="457" name="__module.bert.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13637688" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="458" name="__module.bert.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13637692" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="459" name="__module.bert.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="460" name="Constant_149316" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="13637696" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="461" name="Convert_149317" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="462" name="Constant_149318" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="13735040" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="463" name="__module.bert.encoder.layer.3.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="464" name="__module.bert.encoder.layer.3.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="465" name="Constant_5049" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13736288" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="466" name="__module.bert.encoder.layer.3.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="329,input.15">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="467" name="__module.bert.encoder.layer.3.attention.output/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="331">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="468" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="9811492" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="469" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="470" name="Constant_5050" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13737536" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="471" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="472" name="Constant_5051" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13738784" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="473" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="335,input_tensor">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="474" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="13740032" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="475" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="476" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13741280" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="477" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13741284" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="478" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13741280" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="479" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="13741284" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="480" name="__module.bert.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="481" name="Constant_149320" type="Const" version="opset1">
<data element_type="i8" shape="1200, 312" offset="13741288" size="374400" />
<output>
<port id="0" precision="I8">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="482" name="Convert_149321" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>1200</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="483" name="Constant_149322" type="Const" version="opset1">
<data element_type="f32" shape="1200, 1" offset="14115688" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1200</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="484" name="__module.bert.encoder.layer.3.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="485" name="__module.bert.encoder.layer.3.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1200</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="486" name="Constant_5052" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1200" offset="14120488" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="487" name="__module.bert.encoder.layer.3.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="339">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="488" name="__module.bert.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
<data approximation_mode="ERF" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="340">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="489" name="__module.bert.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 1200" offset="14125288" size="4800" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="490" name="__module.bert.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="491" name="__module.bert.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14130088" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="492" name="__module.bert.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14130092" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="493" name="__module.bert.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14130088" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="494" name="__module.bert.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14130092" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="495" name="__module.bert.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="496" name="Constant_149324" type="Const" version="opset1">
<data element_type="i8" shape="312, 1200" offset="14130096" size="374400" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="497" name="Convert_149325" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="498" name="Constant_149326" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="14504496" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="499" name="__module.bert.encoder.layer.3.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</output>
</layer>
<layer id="500" name="__module.bert.encoder.layer.3.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>1200</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1200</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="501" name="Constant_5053" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="14505744" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="502" name="__module.bert.encoder.layer.3.output.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="345,input.17">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="503" name="__module.bert.encoder.layer.3.output/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="347">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="504" name="__module.bert.encoder.layer.3.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
<data element_type="i32" shape="1" offset="9811492" size="4" />
<output>
<port id="0" precision="I32">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="505" name="__module.bert.encoder.layer.3.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I32">
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="506" name="Constant_5054" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="14506992" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="507" name="__module.bert.encoder.layer.3.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="508" name="Constant_5055" type="Const" version="opset1">
<data element_type="f32" shape="1, 1, 312" offset="14508240" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="509" name="__module.bert.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="351,353,hidden_states">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="510" name="23" type="Const" version="opset1">
<data element_type="i64" shape="" offset="9811476" size="8" />
<output>
<port id="0" precision="I64" names="23" />
</output>
</layer>
<layer id="511" name="__module.bert.pooler/aten::select/Gather" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="I64" />
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="FP32" names="354">
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="512" name="__module.bert.pooler/aten::select/Gather_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 312" offset="14509488" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="513" name="__module.bert.pooler/aten::select/Gather_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="514" name="__module.bert.pooler/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14510736" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="515" name="__module.bert.pooler/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14510740" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="516" name="__module.bert.pooler/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14510736" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="517" name="__module.bert.pooler/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14510740" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="518" name="__module.bert.pooler/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="519" name="Constant_149328" type="Const" version="opset1">
<data element_type="i8" shape="312, 312" offset="14510744" size="97344" />
<output>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="520" name="Convert_149329" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="521" name="Constant_149330" type="Const" version="opset1">
<data element_type="f32" shape="312, 1" offset="14608088" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="522" name="__module.bert.pooler.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="523" name="__module.bert.pooler.dense/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>312</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="524" name="Constant_5056" type="Const" version="opset1">
<data element_type="f32" shape="1, 312" offset="14609336" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="525" name="__module.bert.pooler.dense/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="357">
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="526" name="__module.bert.pooler.activation/aten::tanh/Tanh" type="Tanh" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32" names="358,input">
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="527" name="__module.bert.pooler.activation/aten::tanh/Tanh_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
<data element_type="f32" shape="1, 312" offset="14610584" size="1248" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="528" name="__module.bert.pooler.activation/aten::tanh/Tanh_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="529" name="__module.bert.pooler.activation/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14611832" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="530" name="__module.bert.pooler.activation/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14611836" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="531" name="__module.bert.pooler.activation/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14611832" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="532" name="__module.bert.pooler.activation/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
<data element_type="f32" shape="" offset="14611836" size="4" />
<output>
<port id="0" precision="FP32" />
</output>
</layer>
<layer id="533" name="__module.bert.pooler.activation/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
<data levels="256" auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32" />
<port id="2" precision="FP32" />
<port id="3" precision="FP32" />
<port id="4" precision="FP32" />
</input>
<output>
<port id="5" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="534" name="Constant_149332" type="Const" version="opset1">
<data element_type="i8" shape="1, 312" offset="14611840" size="312" />
<output>
<port id="0" precision="I8">
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="535" name="Convert_149333" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="536" name="Constant_149334" type="Const" version="opset1">
<data element_type="f32" shape="1, 1" offset="14612152" size="4" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="537" name="__module.classifier/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>1</dim>
<dim>312</dim>
</port>
</output>
</layer>
<layer id="538" name="__module.classifier/aten::linear/MatMul" type="MatMul" version="opset1">
<data transpose_a="false" transpose_b="true" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>312</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>312</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="539" name="Constant_5057" type="Const" version="opset1">
<data element_type="f32" shape="1, 1" offset="14612156" size="4" />
<output>
<port id="0" precision="FP32">
<dim>1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="540" name="__module.classifier/aten::linear/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
</port>
<port id="1" precision="FP32">
<dim>1</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="logits">
<dim>-1</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="541" name="Result_1950" type="Result" version="opset1">
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>1</dim>
</port>
</input>
</layer>
</layers>
<edges>
<edge from-layer="0" from-port="0" to-layer="14" to-port="0" />
<edge from-layer="1" from-port="0" to-layer="93" to-port="0" />
<edge from-layer="2" from-port="0" to-layer="7" to-port="0" />
<edge from-layer="2" from-port="0" to-layer="24" to-port="0" />
<edge from-layer="3" from-port="0" to-layer="4" to-port="0" />
<edge from-layer="4" from-port="1" to-layer="6" to-port="0" />
<edge from-layer="5" from-port="0" to-layer="6" to-port="1" />
<edge from-layer="6" from-port="2" to-layer="9" to-port="0" />
<edge from-layer="7" from-port="1" to-layer="9" to-port="1" />
<edge from-layer="8" from-port="0" to-layer="9" to-port="2" />
<edge from-layer="9" from-port="3" to-layer="17" to-port="0" />
<edge from-layer="10" from-port="0" to-layer="11" to-port="0" />
<edge from-layer="11" from-port="1" to-layer="13" to-port="0" />
<edge from-layer="12" from-port="0" to-layer="13" to-port="1" />
<edge from-layer="13" from-port="2" to-layer="16" to-port="0" />
<edge from-layer="14" from-port="1" to-layer="16" to-port="1" />
<edge from-layer="15" from-port="0" to-layer="16" to-port="2" />
<edge from-layer="16" from-port="3" to-layer="17" to-port="1" />
<edge from-layer="17" from-port="2" to-layer="34" to-port="0" />
<edge from-layer="18" from-port="0" to-layer="19" to-port="0" />
<edge from-layer="19" from-port="1" to-layer="21" to-port="0" />
<edge from-layer="20" from-port="0" to-layer="21" to-port="1" />
<edge from-layer="21" from-port="2" to-layer="33" to-port="0" />
<edge from-layer="22" from-port="0" to-layer="30" to-port="0" />
<edge from-layer="23" from-port="0" to-layer="30" to-port="1" />
<edge from-layer="24" from-port="1" to-layer="27" to-port="0" />
<edge from-layer="24" from-port="1" to-layer="102" to-port="0" />
<edge from-layer="24" from-port="1" to-layer="98" to-port="0" />
<edge from-layer="25" from-port="0" to-layer="27" to-port="1" />
<edge from-layer="26" from-port="0" to-layer="27" to-port="2" />
<edge from-layer="27" from-port="3" to-layer="30" to-port="2" />
<edge from-layer="28" from-port="0" to-layer="30" to-port="3" />
<edge from-layer="29" from-port="0" to-layer="30" to-port="4" />
<edge from-layer="30" from-port="5" to-layer="31" to-port="0" />
<edge from-layer="31" from-port="1" to-layer="33" to-port="1" />
<edge from-layer="32" from-port="0" to-layer="33" to-port="2" />
<edge from-layer="33" from-port="3" to-layer="34" to-port="1" />
<edge from-layer="34" from-port="2" to-layer="36" to-port="0" />
<edge from-layer="35" from-port="0" to-layer="36" to-port="1" />
<edge from-layer="36" from-port="2" to-layer="38" to-port="0" />
<edge from-layer="37" from-port="0" to-layer="38" to-port="1" />
<edge from-layer="38" from-port="2" to-layer="40" to-port="0" />
<edge from-layer="39" from-port="0" to-layer="40" to-port="1" />
<edge from-layer="40" from-port="2" to-layer="131" to-port="1" />
<edge from-layer="40" from-port="2" to-layer="42" to-port="0" />
<edge from-layer="41" from-port="0" to-layer="42" to-port="1" />
<edge from-layer="42" from-port="2" to-layer="47" to-port="0" />
<edge from-layer="43" from-port="0" to-layer="47" to-port="1" />
<edge from-layer="44" from-port="0" to-layer="47" to-port="2" />
<edge from-layer="45" from-port="0" to-layer="47" to-port="3" />
<edge from-layer="46" from-port="0" to-layer="47" to-port="4" />
<edge from-layer="47" from-port="5" to-layer="52" to-port="0" />
<edge from-layer="47" from-port="5" to-layer="68" to-port="0" />
<edge from-layer="47" from-port="5" to-layer="84" to-port="0" />
<edge from-layer="48" from-port="0" to-layer="49" to-port="0" />
<edge from-layer="49" from-port="1" to-layer="51" to-port="0" />
<edge from-layer="50" from-port="0" to-layer="51" to-port="1" />
<edge from-layer="51" from-port="2" to-layer="52" to-port="1" />
<edge from-layer="52" from-port="2" to-layer="54" to-port="0" />
<edge from-layer="53" from-port="0" to-layer="54" to-port="1" />
<edge from-layer="54" from-port="2" to-layer="59" to-port="0" />
<edge from-layer="55" from-port="0" to-layer="59" to-port="1" />
<edge from-layer="56" from-port="0" to-layer="59" to-port="2" />
<edge from-layer="57" from-port="0" to-layer="59" to-port="3" />
<edge from-layer="58" from-port="0" to-layer="59" to-port="4" />
<edge from-layer="59" from-port="5" to-layer="61" to-port="0" />
<edge from-layer="60" from-port="0" to-layer="61" to-port="1" />
<edge from-layer="61" from-port="2" to-layer="63" to-port="0" />
<edge from-layer="62" from-port="0" to-layer="63" to-port="1" />
<edge from-layer="63" from-port="2" to-layer="112" to-port="0" />
<edge from-layer="64" from-port="0" to-layer="65" to-port="0" />
<edge from-layer="65" from-port="1" to-layer="67" to-port="0" />
<edge from-layer="66" from-port="0" to-layer="67" to-port="1" />
<edge from-layer="67" from-port="2" to-layer="68" to-port="1" />
<edge from-layer="68" from-port="2" to-layer="70" to-port="0" />
<edge from-layer="69" from-port="0" to-layer="70" to-port="1" />
<edge from-layer="70" from-port="2" to-layer="75" to-port="0" />
<edge from-layer="71" from-port="0" to-layer="75" to-port="1" />
<edge from-layer="72" from-port="0" to-layer="75" to-port="2" />
<edge from-layer="73" from-port="0" to-layer="75" to-port="3" />
<edge from-layer="74" from-port="0" to-layer="75" to-port="4" />
<edge from-layer="75" from-port="5" to-layer="77" to-port="0" />
<edge from-layer="76" from-port="0" to-layer="77" to-port="1" />
<edge from-layer="77" from-port="2" to-layer="79" to-port="0" />
<edge from-layer="78" from-port="0" to-layer="79" to-port="1" />
<edge from-layer="79" from-port="2" to-layer="112" to-port="1" />
<edge from-layer="80" from-port="0" to-layer="81" to-port="0" />
<edge from-layer="81" from-port="1" to-layer="83" to-port="0" />
<edge from-layer="82" from-port="0" to-layer="83" to-port="1" />
<edge from-layer="83" from-port="2" to-layer="84" to-port="1" />
<edge from-layer="84" from-port="2" to-layer="86" to-port="0" />
<edge from-layer="85" from-port="0" to-layer="86" to-port="1" />
<edge from-layer="86" from-port="2" to-layer="88" to-port="0" />
<edge from-layer="87" from-port="0" to-layer="88" to-port="1" />
<edge from-layer="88" from-port="2" to-layer="90" to-port="0" />
<edge from-layer="89" from-port="0" to-layer="90" to-port="1" />
<edge from-layer="90" from-port="2" to-layer="112" to-port="2" />
<edge from-layer="91" from-port="0" to-layer="108" to-port="0" />
<edge from-layer="92" from-port="0" to-layer="93" to-port="1" />
<edge from-layer="92" from-port="0" to-layer="511" to-port="2" />
<edge from-layer="93" from-port="2" to-layer="95" to-port="0" />
<edge from-layer="94" from-port="0" to-layer="95" to-port="1" />
<edge from-layer="95" from-port="2" to-layer="104" to-port="0" />
<edge from-layer="96" from-port="0" to-layer="98" to-port="1" />
<edge from-layer="97" from-port="0" to-layer="98" to-port="2" />
<edge from-layer="98" from-port="3" to-layer="103" to-port="0" />
<edge from-layer="99" from-port="0" to-layer="103" to-port="1" />
<edge from-layer="100" from-port="0" to-layer="102" to-port="1" />
<edge from-layer="101" from-port="0" to-layer="102" to-port="2" />
<edge from-layer="102" from-port="3" to-layer="103" to-port="2" />
<edge from-layer="103" from-port="3" to-layer="104" to-port="1" />
<edge from-layer="104" from-port="2" to-layer="105" to-port="0" />
<edge from-layer="105" from-port="1" to-layer="107" to-port="0" />
<edge from-layer="106" from-port="0" to-layer="107" to-port="1" />
<edge from-layer="107" from-port="2" to-layer="108" to-port="1" />
<edge from-layer="108" from-port="2" to-layer="111" to-port="2" />
<edge from-layer="108" from-port="2" to-layer="109" to-port="0" />
<edge from-layer="109" from-port="1" to-layer="111" to-port="0" />
<edge from-layer="110" from-port="0" to-layer="111" to-port="1" />
<edge from-layer="111" from-port="3" to-layer="112" to-port="3" />
<edge from-layer="111" from-port="3" to-layer="448" to-port="3" />
<edge from-layer="111" from-port="3" to-layer="224" to-port="3" />
<edge from-layer="111" from-port="3" to-layer="336" to-port="3" />
<edge from-layer="112" from-port="4" to-layer="114" to-port="0" />
<edge from-layer="113" from-port="0" to-layer="114" to-port="1" />
<edge from-layer="114" from-port="2" to-layer="116" to-port="0" />
<edge from-layer="115" from-port="0" to-layer="116" to-port="1" />
<edge from-layer="116" from-port="2" to-layer="118" to-port="0" />
<edge from-layer="117" from-port="0" to-layer="118" to-port="1" />
<edge from-layer="118" from-port="2" to-layer="123" to-port="0" />
<edge from-layer="119" from-port="0" to-layer="123" to-port="1" />
<edge from-layer="120" from-port="0" to-layer="123" to-port="2" />
<edge from-layer="121" from-port="0" to-layer="123" to-port="3" />
<edge from-layer="122" from-port="0" to-layer="123" to-port="4" />
<edge from-layer="123" from-port="5" to-layer="128" to-port="0" />
<edge from-layer="124" from-port="0" to-layer="125" to-port="0" />
<edge from-layer="125" from-port="1" to-layer="127" to-port="0" />
<edge from-layer="126" from-port="0" to-layer="127" to-port="1" />
<edge from-layer="127" from-port="2" to-layer="128" to-port="1" />
<edge from-layer="128" from-port="2" to-layer="130" to-port="0" />
<edge from-layer="129" from-port="0" to-layer="130" to-port="1" />
<edge from-layer="130" from-port="2" to-layer="131" to-port="0" />
<edge from-layer="131" from-port="2" to-layer="133" to-port="0" />
<edge from-layer="132" from-port="0" to-layer="133" to-port="1" />
<edge from-layer="133" from-port="2" to-layer="135" to-port="0" />
<edge from-layer="134" from-port="0" to-layer="135" to-port="1" />
<edge from-layer="135" from-port="2" to-layer="137" to-port="0" />
<edge from-layer="136" from-port="0" to-layer="137" to-port="1" />
<edge from-layer="137" from-port="2" to-layer="139" to-port="0" />
<edge from-layer="137" from-port="2" to-layer="167" to-port="1" />
<edge from-layer="138" from-port="0" to-layer="139" to-port="1" />
<edge from-layer="139" from-port="2" to-layer="144" to-port="0" />
<edge from-layer="140" from-port="0" to-layer="144" to-port="1" />
<edge from-layer="141" from-port="0" to-layer="144" to-port="2" />
<edge from-layer="142" from-port="0" to-layer="144" to-port="3" />
<edge from-layer="143" from-port="0" to-layer="144" to-port="4" />
<edge from-layer="144" from-port="5" to-layer="149" to-port="0" />
<edge from-layer="145" from-port="0" to-layer="146" to-port="0" />
<edge from-layer="146" from-port="1" to-layer="148" to-port="0" />
<edge from-layer="147" from-port="0" to-layer="148" to-port="1" />
<edge from-layer="148" from-port="2" to-layer="149" to-port="1" />
<edge from-layer="149" from-port="2" to-layer="151" to-port="0" />
<edge from-layer="150" from-port="0" to-layer="151" to-port="1" />
<edge from-layer="151" from-port="2" to-layer="152" to-port="0" />
<edge from-layer="152" from-port="1" to-layer="154" to-port="0" />
<edge from-layer="153" from-port="0" to-layer="154" to-port="1" />
<edge from-layer="154" from-port="2" to-layer="159" to-port="0" />
<edge from-layer="155" from-port="0" to-layer="159" to-port="1" />
<edge from-layer="156" from-port="0" to-layer="159" to-port="2" />
<edge from-layer="157" from-port="0" to-layer="159" to-port="3" />
<edge from-layer="158" from-port="0" to-layer="159" to-port="4" />
<edge from-layer="159" from-port="5" to-layer="164" to-port="0" />
<edge from-layer="160" from-port="0" to-layer="161" to-port="0" />
<edge from-layer="161" from-port="1" to-layer="163" to-port="0" />
<edge from-layer="162" from-port="0" to-layer="163" to-port="1" />
<edge from-layer="163" from-port="2" to-layer="164" to-port="1" />
<edge from-layer="164" from-port="2" to-layer="166" to-port="0" />
<edge from-layer="165" from-port="0" to-layer="166" to-port="1" />
<edge from-layer="166" from-port="2" to-layer="167" to-port="0" />
<edge from-layer="167" from-port="2" to-layer="169" to-port="0" />
<edge from-layer="168" from-port="0" to-layer="169" to-port="1" />
<edge from-layer="169" from-port="2" to-layer="171" to-port="0" />
<edge from-layer="170" from-port="0" to-layer="171" to-port="1" />
<edge from-layer="171" from-port="2" to-layer="173" to-port="0" />
<edge from-layer="172" from-port="0" to-layer="173" to-port="1" />
<edge from-layer="173" from-port="2" to-layer="243" to-port="1" />
<edge from-layer="173" from-port="2" to-layer="175" to-port="0" />
<edge from-layer="174" from-port="0" to-layer="175" to-port="1" />
<edge from-layer="175" from-port="2" to-layer="180" to-port="0" />
<edge from-layer="176" from-port="0" to-layer="180" to-port="1" />
<edge from-layer="177" from-port="0" to-layer="180" to-port="2" />
<edge from-layer="178" from-port="0" to-layer="180" to-port="3" />
<edge from-layer="179" from-port="0" to-layer="180" to-port="4" />
<edge from-layer="180" from-port="5" to-layer="185" to-port="0" />
<edge from-layer="180" from-port="5" to-layer="201" to-port="0" />
<edge from-layer="180" from-port="5" to-layer="217" to-port="0" />
<edge from-layer="181" from-port="0" to-layer="182" to-port="0" />
<edge from-layer="182" from-port="1" to-layer="184" to-port="0" />
<edge from-layer="183" from-port="0" to-layer="184" to-port="1" />
<edge from-layer="184" from-port="2" to-layer="185" to-port="1" />
<edge from-layer="185" from-port="2" to-layer="187" to-port="0" />
<edge from-layer="186" from-port="0" to-layer="187" to-port="1" />
<edge from-layer="187" from-port="2" to-layer="192" to-port="0" />
<edge from-layer="188" from-port="0" to-layer="192" to-port="1" />
<edge from-layer="189" from-port="0" to-layer="192" to-port="2" />
<edge from-layer="190" from-port="0" to-layer="192" to-port="3" />
<edge from-layer="191" from-port="0" to-layer="192" to-port="4" />
<edge from-layer="192" from-port="5" to-layer="194" to-port="0" />
<edge from-layer="193" from-port="0" to-layer="194" to-port="1" />
<edge from-layer="194" from-port="2" to-layer="196" to-port="0" />
<edge from-layer="195" from-port="0" to-layer="196" to-port="1" />
<edge from-layer="196" from-port="2" to-layer="224" to-port="0" />
<edge from-layer="197" from-port="0" to-layer="198" to-port="0" />
<edge from-layer="198" from-port="1" to-layer="200" to-port="0" />
<edge from-layer="199" from-port="0" to-layer="200" to-port="1" />
<edge from-layer="200" from-port="2" to-layer="201" to-port="1" />
<edge from-layer="201" from-port="2" to-layer="203" to-port="0" />
<edge from-layer="202" from-port="0" to-layer="203" to-port="1" />
<edge from-layer="203" from-port="2" to-layer="208" to-port="0" />
<edge from-layer="204" from-port="0" to-layer="208" to-port="1" />
<edge from-layer="205" from-port="0" to-layer="208" to-port="2" />
<edge from-layer="206" from-port="0" to-layer="208" to-port="3" />
<edge from-layer="207" from-port="0" to-layer="208" to-port="4" />
<edge from-layer="208" from-port="5" to-layer="210" to-port="0" />
<edge from-layer="209" from-port="0" to-layer="210" to-port="1" />
<edge from-layer="210" from-port="2" to-layer="212" to-port="0" />
<edge from-layer="211" from-port="0" to-layer="212" to-port="1" />
<edge from-layer="212" from-port="2" to-layer="224" to-port="1" />
<edge from-layer="213" from-port="0" to-layer="214" to-port="0" />
<edge from-layer="214" from-port="1" to-layer="216" to-port="0" />
<edge from-layer="215" from-port="0" to-layer="216" to-port="1" />
<edge from-layer="216" from-port="2" to-layer="217" to-port="1" />
<edge from-layer="217" from-port="2" to-layer="219" to-port="0" />
<edge from-layer="218" from-port="0" to-layer="219" to-port="1" />
<edge from-layer="219" from-port="2" to-layer="221" to-port="0" />
<edge from-layer="220" from-port="0" to-layer="221" to-port="1" />
<edge from-layer="221" from-port="2" to-layer="223" to-port="0" />
<edge from-layer="222" from-port="0" to-layer="223" to-port="1" />
<edge from-layer="223" from-port="2" to-layer="224" to-port="2" />
<edge from-layer="224" from-port="4" to-layer="226" to-port="0" />
<edge from-layer="225" from-port="0" to-layer="226" to-port="1" />
<edge from-layer="226" from-port="2" to-layer="228" to-port="0" />
<edge from-layer="227" from-port="0" to-layer="228" to-port="1" />
<edge from-layer="228" from-port="2" to-layer="230" to-port="0" />
<edge from-layer="229" from-port="0" to-layer="230" to-port="1" />
<edge from-layer="230" from-port="2" to-layer="235" to-port="0" />
<edge from-layer="231" from-port="0" to-layer="235" to-port="1" />
<edge from-layer="232" from-port="0" to-layer="235" to-port="2" />
<edge from-layer="233" from-port="0" to-layer="235" to-port="3" />
<edge from-layer="234" from-port="0" to-layer="235" to-port="4" />
<edge from-layer="235" from-port="5" to-layer="240" to-port="0" />
<edge from-layer="236" from-port="0" to-layer="237" to-port="0" />
<edge from-layer="237" from-port="1" to-layer="239" to-port="0" />
<edge from-layer="238" from-port="0" to-layer="239" to-port="1" />
<edge from-layer="239" from-port="2" to-layer="240" to-port="1" />
<edge from-layer="240" from-port="2" to-layer="242" to-port="0" />
<edge from-layer="241" from-port="0" to-layer="242" to-port="1" />
<edge from-layer="242" from-port="2" to-layer="243" to-port="0" />
<edge from-layer="243" from-port="2" to-layer="245" to-port="0" />
<edge from-layer="244" from-port="0" to-layer="245" to-port="1" />
<edge from-layer="245" from-port="2" to-layer="247" to-port="0" />
<edge from-layer="246" from-port="0" to-layer="247" to-port="1" />
<edge from-layer="247" from-port="2" to-layer="249" to-port="0" />
<edge from-layer="248" from-port="0" to-layer="249" to-port="1" />
<edge from-layer="249" from-port="2" to-layer="251" to-port="0" />
<edge from-layer="249" from-port="2" to-layer="279" to-port="1" />
<edge from-layer="250" from-port="0" to-layer="251" to-port="1" />
<edge from-layer="251" from-port="2" to-layer="256" to-port="0" />
<edge from-layer="252" from-port="0" to-layer="256" to-port="1" />
<edge from-layer="253" from-port="0" to-layer="256" to-port="2" />
<edge from-layer="254" from-port="0" to-layer="256" to-port="3" />
<edge from-layer="255" from-port="0" to-layer="256" to-port="4" />
<edge from-layer="256" from-port="5" to-layer="261" to-port="0" />
<edge from-layer="257" from-port="0" to-layer="258" to-port="0" />
<edge from-layer="258" from-port="1" to-layer="260" to-port="0" />
<edge from-layer="259" from-port="0" to-layer="260" to-port="1" />
<edge from-layer="260" from-port="2" to-layer="261" to-port="1" />
<edge from-layer="261" from-port="2" to-layer="263" to-port="0" />
<edge from-layer="262" from-port="0" to-layer="263" to-port="1" />
<edge from-layer="263" from-port="2" to-layer="264" to-port="0" />
<edge from-layer="264" from-port="1" to-layer="266" to-port="0" />
<edge from-layer="265" from-port="0" to-layer="266" to-port="1" />
<edge from-layer="266" from-port="2" to-layer="271" to-port="0" />
<edge from-layer="267" from-port="0" to-layer="271" to-port="1" />
<edge from-layer="268" from-port="0" to-layer="271" to-port="2" />
<edge from-layer="269" from-port="0" to-layer="271" to-port="3" />
<edge from-layer="270" from-port="0" to-layer="271" to-port="4" />
<edge from-layer="271" from-port="5" to-layer="276" to-port="0" />
<edge from-layer="272" from-port="0" to-layer="273" to-port="0" />
<edge from-layer="273" from-port="1" to-layer="275" to-port="0" />
<edge from-layer="274" from-port="0" to-layer="275" to-port="1" />
<edge from-layer="275" from-port="2" to-layer="276" to-port="1" />
<edge from-layer="276" from-port="2" to-layer="278" to-port="0" />
<edge from-layer="277" from-port="0" to-layer="278" to-port="1" />
<edge from-layer="278" from-port="2" to-layer="279" to-port="0" />
<edge from-layer="279" from-port="2" to-layer="281" to-port="0" />
<edge from-layer="280" from-port="0" to-layer="281" to-port="1" />
<edge from-layer="281" from-port="2" to-layer="283" to-port="0" />
<edge from-layer="282" from-port="0" to-layer="283" to-port="1" />
<edge from-layer="283" from-port="2" to-layer="285" to-port="0" />
<edge from-layer="284" from-port="0" to-layer="285" to-port="1" />
<edge from-layer="285" from-port="2" to-layer="287" to-port="0" />
<edge from-layer="285" from-port="2" to-layer="355" to-port="1" />
<edge from-layer="286" from-port="0" to-layer="287" to-port="1" />
<edge from-layer="287" from-port="2" to-layer="292" to-port="0" />
<edge from-layer="288" from-port="0" to-layer="292" to-port="1" />
<edge from-layer="289" from-port="0" to-layer="292" to-port="2" />
<edge from-layer="290" from-port="0" to-layer="292" to-port="3" />
<edge from-layer="291" from-port="0" to-layer="292" to-port="4" />
<edge from-layer="292" from-port="5" to-layer="297" to-port="0" />
<edge from-layer="292" from-port="5" to-layer="313" to-port="0" />
<edge from-layer="292" from-port="5" to-layer="329" to-port="0" />
<edge from-layer="293" from-port="0" to-layer="294" to-port="0" />
<edge from-layer="294" from-port="1" to-layer="296" to-port="0" />
<edge from-layer="295" from-port="0" to-layer="296" to-port="1" />
<edge from-layer="296" from-port="2" to-layer="297" to-port="1" />
<edge from-layer="297" from-port="2" to-layer="299" to-port="0" />
<edge from-layer="298" from-port="0" to-layer="299" to-port="1" />
<edge from-layer="299" from-port="2" to-layer="304" to-port="0" />
<edge from-layer="300" from-port="0" to-layer="304" to-port="1" />
<edge from-layer="301" from-port="0" to-layer="304" to-port="2" />
<edge from-layer="302" from-port="0" to-layer="304" to-port="3" />
<edge from-layer="303" from-port="0" to-layer="304" to-port="4" />
<edge from-layer="304" from-port="5" to-layer="306" to-port="0" />
<edge from-layer="305" from-port="0" to-layer="306" to-port="1" />
<edge from-layer="306" from-port="2" to-layer="308" to-port="0" />
<edge from-layer="307" from-port="0" to-layer="308" to-port="1" />
<edge from-layer="308" from-port="2" to-layer="336" to-port="0" />
<edge from-layer="309" from-port="0" to-layer="310" to-port="0" />
<edge from-layer="310" from-port="1" to-layer="312" to-port="0" />
<edge from-layer="311" from-port="0" to-layer="312" to-port="1" />
<edge from-layer="312" from-port="2" to-layer="313" to-port="1" />
<edge from-layer="313" from-port="2" to-layer="315" to-port="0" />
<edge from-layer="314" from-port="0" to-layer="315" to-port="1" />
<edge from-layer="315" from-port="2" to-layer="320" to-port="0" />
<edge from-layer="316" from-port="0" to-layer="320" to-port="1" />
<edge from-layer="317" from-port="0" to-layer="320" to-port="2" />
<edge from-layer="318" from-port="0" to-layer="320" to-port="3" />
<edge from-layer="319" from-port="0" to-layer="320" to-port="4" />
<edge from-layer="320" from-port="5" to-layer="322" to-port="0" />
<edge from-layer="321" from-port="0" to-layer="322" to-port="1" />
<edge from-layer="322" from-port="2" to-layer="324" to-port="0" />
<edge from-layer="323" from-port="0" to-layer="324" to-port="1" />
<edge from-layer="324" from-port="2" to-layer="336" to-port="1" />
<edge from-layer="325" from-port="0" to-layer="326" to-port="0" />
<edge from-layer="326" from-port="1" to-layer="328" to-port="0" />
<edge from-layer="327" from-port="0" to-layer="328" to-port="1" />
<edge from-layer="328" from-port="2" to-layer="329" to-port="1" />
<edge from-layer="329" from-port="2" to-layer="331" to-port="0" />
<edge from-layer="330" from-port="0" to-layer="331" to-port="1" />
<edge from-layer="331" from-port="2" to-layer="333" to-port="0" />
<edge from-layer="332" from-port="0" to-layer="333" to-port="1" />
<edge from-layer="333" from-port="2" to-layer="335" to-port="0" />
<edge from-layer="334" from-port="0" to-layer="335" to-port="1" />
<edge from-layer="335" from-port="2" to-layer="336" to-port="2" />
<edge from-layer="336" from-port="4" to-layer="338" to-port="0" />
<edge from-layer="337" from-port="0" to-layer="338" to-port="1" />
<edge from-layer="338" from-port="2" to-layer="340" to-port="0" />
<edge from-layer="339" from-port="0" to-layer="340" to-port="1" />
<edge from-layer="340" from-port="2" to-layer="342" to-port="0" />
<edge from-layer="341" from-port="0" to-layer="342" to-port="1" />
<edge from-layer="342" from-port="2" to-layer="347" to-port="0" />
<edge from-layer="343" from-port="0" to-layer="347" to-port="1" />
<edge from-layer="344" from-port="0" to-layer="347" to-port="2" />
<edge from-layer="345" from-port="0" to-layer="347" to-port="3" />
<edge from-layer="346" from-port="0" to-layer="347" to-port="4" />
<edge from-layer="347" from-port="5" to-layer="352" to-port="0" />
<edge from-layer="348" from-port="0" to-layer="349" to-port="0" />
<edge from-layer="349" from-port="1" to-layer="351" to-port="0" />
<edge from-layer="350" from-port="0" to-layer="351" to-port="1" />
<edge from-layer="351" from-port="2" to-layer="352" to-port="1" />
<edge from-layer="352" from-port="2" to-layer="354" to-port="0" />
<edge from-layer="353" from-port="0" to-layer="354" to-port="1" />
<edge from-layer="354" from-port="2" to-layer="355" to-port="0" />
<edge from-layer="355" from-port="2" to-layer="357" to-port="0" />
<edge from-layer="356" from-port="0" to-layer="357" to-port="1" />
<edge from-layer="357" from-port="2" to-layer="359" to-port="0" />
<edge from-layer="358" from-port="0" to-layer="359" to-port="1" />
<edge from-layer="359" from-port="2" to-layer="361" to-port="0" />
<edge from-layer="360" from-port="0" to-layer="361" to-port="1" />
<edge from-layer="361" from-port="2" to-layer="363" to-port="0" />
<edge from-layer="361" from-port="2" to-layer="391" to-port="1" />
<edge from-layer="362" from-port="0" to-layer="363" to-port="1" />
<edge from-layer="363" from-port="2" to-layer="368" to-port="0" />
<edge from-layer="364" from-port="0" to-layer="368" to-port="1" />
<edge from-layer="365" from-port="0" to-layer="368" to-port="2" />
<edge from-layer="366" from-port="0" to-layer="368" to-port="3" />
<edge from-layer="367" from-port="0" to-layer="368" to-port="4" />
<edge from-layer="368" from-port="5" to-layer="373" to-port="0" />
<edge from-layer="369" from-port="0" to-layer="370" to-port="0" />
<edge from-layer="370" from-port="1" to-layer="372" to-port="0" />
<edge from-layer="371" from-port="0" to-layer="372" to-port="1" />
<edge from-layer="372" from-port="2" to-layer="373" to-port="1" />
<edge from-layer="373" from-port="2" to-layer="375" to-port="0" />
<edge from-layer="374" from-port="0" to-layer="375" to-port="1" />
<edge from-layer="375" from-port="2" to-layer="376" to-port="0" />
<edge from-layer="376" from-port="1" to-layer="378" to-port="0" />
<edge from-layer="377" from-port="0" to-layer="378" to-port="1" />
<edge from-layer="378" from-port="2" to-layer="383" to-port="0" />
<edge from-layer="379" from-port="0" to-layer="383" to-port="1" />
<edge from-layer="380" from-port="0" to-layer="383" to-port="2" />
<edge from-layer="381" from-port="0" to-layer="383" to-port="3" />
<edge from-layer="382" from-port="0" to-layer="383" to-port="4" />
<edge from-layer="383" from-port="5" to-layer="388" to-port="0" />
<edge from-layer="384" from-port="0" to-layer="385" to-port="0" />
<edge from-layer="385" from-port="1" to-layer="387" to-port="0" />
<edge from-layer="386" from-port="0" to-layer="387" to-port="1" />
<edge from-layer="387" from-port="2" to-layer="388" to-port="1" />
<edge from-layer="388" from-port="2" to-layer="390" to-port="0" />
<edge from-layer="389" from-port="0" to-layer="390" to-port="1" />
<edge from-layer="390" from-port="2" to-layer="391" to-port="0" />
<edge from-layer="391" from-port="2" to-layer="393" to-port="0" />
<edge from-layer="392" from-port="0" to-layer="393" to-port="1" />
<edge from-layer="393" from-port="2" to-layer="395" to-port="0" />
<edge from-layer="394" from-port="0" to-layer="395" to-port="1" />
<edge from-layer="395" from-port="2" to-layer="397" to-port="0" />
<edge from-layer="396" from-port="0" to-layer="397" to-port="1" />
<edge from-layer="397" from-port="2" to-layer="399" to-port="0" />
<edge from-layer="397" from-port="2" to-layer="467" to-port="1" />
<edge from-layer="398" from-port="0" to-layer="399" to-port="1" />
<edge from-layer="399" from-port="2" to-layer="404" to-port="0" />
<edge from-layer="400" from-port="0" to-layer="404" to-port="1" />
<edge from-layer="401" from-port="0" to-layer="404" to-port="2" />
<edge from-layer="402" from-port="0" to-layer="404" to-port="3" />
<edge from-layer="403" from-port="0" to-layer="404" to-port="4" />
<edge from-layer="404" from-port="5" to-layer="409" to-port="0" />
<edge from-layer="404" from-port="5" to-layer="425" to-port="0" />
<edge from-layer="404" from-port="5" to-layer="441" to-port="0" />
<edge from-layer="405" from-port="0" to-layer="406" to-port="0" />
<edge from-layer="406" from-port="1" to-layer="408" to-port="0" />
<edge from-layer="407" from-port="0" to-layer="408" to-port="1" />
<edge from-layer="408" from-port="2" to-layer="409" to-port="1" />
<edge from-layer="409" from-port="2" to-layer="411" to-port="0" />
<edge from-layer="410" from-port="0" to-layer="411" to-port="1" />
<edge from-layer="411" from-port="2" to-layer="416" to-port="0" />
<edge from-layer="412" from-port="0" to-layer="416" to-port="1" />
<edge from-layer="413" from-port="0" to-layer="416" to-port="2" />
<edge from-layer="414" from-port="0" to-layer="416" to-port="3" />
<edge from-layer="415" from-port="0" to-layer="416" to-port="4" />
<edge from-layer="416" from-port="5" to-layer="418" to-port="0" />
<edge from-layer="417" from-port="0" to-layer="418" to-port="1" />
<edge from-layer="418" from-port="2" to-layer="420" to-port="0" />
<edge from-layer="419" from-port="0" to-layer="420" to-port="1" />
<edge from-layer="420" from-port="2" to-layer="448" to-port="0" />
<edge from-layer="421" from-port="0" to-layer="422" to-port="0" />
<edge from-layer="422" from-port="1" to-layer="424" to-port="0" />
<edge from-layer="423" from-port="0" to-layer="424" to-port="1" />
<edge from-layer="424" from-port="2" to-layer="425" to-port="1" />
<edge from-layer="425" from-port="2" to-layer="427" to-port="0" />
<edge from-layer="426" from-port="0" to-layer="427" to-port="1" />
<edge from-layer="427" from-port="2" to-layer="432" to-port="0" />
<edge from-layer="428" from-port="0" to-layer="432" to-port="1" />
<edge from-layer="429" from-port="0" to-layer="432" to-port="2" />
<edge from-layer="430" from-port="0" to-layer="432" to-port="3" />
<edge from-layer="431" from-port="0" to-layer="432" to-port="4" />
<edge from-layer="432" from-port="5" to-layer="434" to-port="0" />
<edge from-layer="433" from-port="0" to-layer="434" to-port="1" />
<edge from-layer="434" from-port="2" to-layer="436" to-port="0" />
<edge from-layer="435" from-port="0" to-layer="436" to-port="1" />
<edge from-layer="436" from-port="2" to-layer="448" to-port="1" />
<edge from-layer="437" from-port="0" to-layer="438" to-port="0" />
<edge from-layer="438" from-port="1" to-layer="440" to-port="0" />
<edge from-layer="439" from-port="0" to-layer="440" to-port="1" />
<edge from-layer="440" from-port="2" to-layer="441" to-port="1" />
<edge from-layer="441" from-port="2" to-layer="443" to-port="0" />
<edge from-layer="442" from-port="0" to-layer="443" to-port="1" />
<edge from-layer="443" from-port="2" to-layer="445" to-port="0" />
<edge from-layer="444" from-port="0" to-layer="445" to-port="1" />
<edge from-layer="445" from-port="2" to-layer="447" to-port="0" />
<edge from-layer="446" from-port="0" to-layer="447" to-port="1" />
<edge from-layer="447" from-port="2" to-layer="448" to-port="2" />
<edge from-layer="448" from-port="4" to-layer="450" to-port="0" />
<edge from-layer="449" from-port="0" to-layer="450" to-port="1" />
<edge from-layer="450" from-port="2" to-layer="452" to-port="0" />
<edge from-layer="451" from-port="0" to-layer="452" to-port="1" />
<edge from-layer="452" from-port="2" to-layer="454" to-port="0" />
<edge from-layer="453" from-port="0" to-layer="454" to-port="1" />
<edge from-layer="454" from-port="2" to-layer="459" to-port="0" />
<edge from-layer="455" from-port="0" to-layer="459" to-port="1" />
<edge from-layer="456" from-port="0" to-layer="459" to-port="2" />
<edge from-layer="457" from-port="0" to-layer="459" to-port="3" />
<edge from-layer="458" from-port="0" to-layer="459" to-port="4" />
<edge from-layer="459" from-port="5" to-layer="464" to-port="0" />
<edge from-layer="460" from-port="0" to-layer="461" to-port="0" />
<edge from-layer="461" from-port="1" to-layer="463" to-port="0" />
<edge from-layer="462" from-port="0" to-layer="463" to-port="1" />
<edge from-layer="463" from-port="2" to-layer="464" to-port="1" />
<edge from-layer="464" from-port="2" to-layer="466" to-port="0" />
<edge from-layer="465" from-port="0" to-layer="466" to-port="1" />
<edge from-layer="466" from-port="2" to-layer="467" to-port="0" />
<edge from-layer="467" from-port="2" to-layer="469" to-port="0" />
<edge from-layer="468" from-port="0" to-layer="469" to-port="1" />
<edge from-layer="469" from-port="2" to-layer="471" to-port="0" />
<edge from-layer="470" from-port="0" to-layer="471" to-port="1" />
<edge from-layer="471" from-port="2" to-layer="473" to-port="0" />
<edge from-layer="472" from-port="0" to-layer="473" to-port="1" />
<edge from-layer="473" from-port="2" to-layer="475" to-port="0" />
<edge from-layer="473" from-port="2" to-layer="503" to-port="1" />
<edge from-layer="474" from-port="0" to-layer="475" to-port="1" />
<edge from-layer="475" from-port="2" to-layer="480" to-port="0" />
<edge from-layer="476" from-port="0" to-layer="480" to-port="1" />
<edge from-layer="477" from-port="0" to-layer="480" to-port="2" />
<edge from-layer="478" from-port="0" to-layer="480" to-port="3" />
<edge from-layer="479" from-port="0" to-layer="480" to-port="4" />
<edge from-layer="480" from-port="5" to-layer="485" to-port="0" />
<edge from-layer="481" from-port="0" to-layer="482" to-port="0" />
<edge from-layer="482" from-port="1" to-layer="484" to-port="0" />
<edge from-layer="483" from-port="0" to-layer="484" to-port="1" />
<edge from-layer="484" from-port="2" to-layer="485" to-port="1" />
<edge from-layer="485" from-port="2" to-layer="487" to-port="0" />
<edge from-layer="486" from-port="0" to-layer="487" to-port="1" />
<edge from-layer="487" from-port="2" to-layer="488" to-port="0" />
<edge from-layer="488" from-port="1" to-layer="490" to-port="0" />
<edge from-layer="489" from-port="0" to-layer="490" to-port="1" />
<edge from-layer="490" from-port="2" to-layer="495" to-port="0" />
<edge from-layer="491" from-port="0" to-layer="495" to-port="1" />
<edge from-layer="492" from-port="0" to-layer="495" to-port="2" />
<edge from-layer="493" from-port="0" to-layer="495" to-port="3" />
<edge from-layer="494" from-port="0" to-layer="495" to-port="4" />
<edge from-layer="495" from-port="5" to-layer="500" to-port="0" />
<edge from-layer="496" from-port="0" to-layer="497" to-port="0" />
<edge from-layer="497" from-port="1" to-layer="499" to-port="0" />
<edge from-layer="498" from-port="0" to-layer="499" to-port="1" />
<edge from-layer="499" from-port="2" to-layer="500" to-port="1" />
<edge from-layer="500" from-port="2" to-layer="502" to-port="0" />
<edge from-layer="501" from-port="0" to-layer="502" to-port="1" />
<edge from-layer="502" from-port="2" to-layer="503" to-port="0" />
<edge from-layer="503" from-port="2" to-layer="505" to-port="0" />
<edge from-layer="504" from-port="0" to-layer="505" to-port="1" />
<edge from-layer="505" from-port="2" to-layer="507" to-port="0" />
<edge from-layer="506" from-port="0" to-layer="507" to-port="1" />
<edge from-layer="507" from-port="2" to-layer="509" to-port="0" />
<edge from-layer="508" from-port="0" to-layer="509" to-port="1" />
<edge from-layer="509" from-port="2" to-layer="511" to-port="0" />
<edge from-layer="510" from-port="0" to-layer="511" to-port="1" />
<edge from-layer="511" from-port="3" to-layer="513" to-port="0" />
<edge from-layer="512" from-port="0" to-layer="513" to-port="1" />
<edge from-layer="513" from-port="2" to-layer="518" to-port="0" />
<edge from-layer="514" from-port="0" to-layer="518" to-port="1" />
<edge from-layer="515" from-port="0" to-layer="518" to-port="2" />
<edge from-layer="516" from-port="0" to-layer="518" to-port="3" />
<edge from-layer="517" from-port="0" to-layer="518" to-port="4" />
<edge from-layer="518" from-port="5" to-layer="523" to-port="0" />
<edge from-layer="519" from-port="0" to-layer="520" to-port="0" />
<edge from-layer="520" from-port="1" to-layer="522" to-port="0" />
<edge from-layer="521" from-port="0" to-layer="522" to-port="1" />
<edge from-layer="522" from-port="2" to-layer="523" to-port="1" />
<edge from-layer="523" from-port="2" to-layer="525" to-port="0" />
<edge from-layer="524" from-port="0" to-layer="525" to-port="1" />
<edge from-layer="525" from-port="2" to-layer="526" to-port="0" />
<edge from-layer="526" from-port="1" to-layer="528" to-port="0" />
<edge from-layer="527" from-port="0" to-layer="528" to-port="1" />
<edge from-layer="528" from-port="2" to-layer="533" to-port="0" />
<edge from-layer="529" from-port="0" to-layer="533" to-port="1" />
<edge from-layer="530" from-port="0" to-layer="533" to-port="2" />
<edge from-layer="531" from-port="0" to-layer="533" to-port="3" />
<edge from-layer="532" from-port="0" to-layer="533" to-port="4" />
<edge from-layer="533" from-port="5" to-layer="538" to-port="0" />
<edge from-layer="534" from-port="0" to-layer="535" to-port="0" />
<edge from-layer="535" from-port="1" to-layer="537" to-port="0" />
<edge from-layer="536" from-port="0" to-layer="537" to-port="1" />
<edge from-layer="537" from-port="2" to-layer="538" to-port="1" />
<edge from-layer="538" from-port="2" to-layer="540" to-port="0" />
<edge from-layer="539" from-port="0" to-layer="540" to-port="1" />
<edge from-layer="540" from-port="2" to-layer="541" to-port="0" />
</edges>
<rt_info>
<Runtime_version value="2024.4.1-16618-643f23d1318-releases/2024/4" />
<conversion_parameters>
<framework value="pytorch" />
<is_python_object value="True" />
</conversion_parameters>
<nncf>
<friendly_names_were_updated value="True" />
<quantization>
<advanced_parameters value="{'overflow_fix': 'disable', 'quantize_outputs': False, 'inplace_statistics': True, 'disable_channel_alignment': True, 'disable_bias_correction': False, 'batchwise_statistics': None, 'activations_quantization_params': None, 'weights_quantization_params': None, 'activations_range_estimator_params': {'min': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}, 'max': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}}, 'weights_range_estimator_params': {'min': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}, 'max': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}}, 'bias_correction_params': {'apply_for_all_nodes': False, 'threshold': None}, 'smooth_quant_alphas': {'convolution': -1, 'matmul': 0.95}, 'smooth_quant_alpha': None, 'backend_params': {}}" />
<fast_bias_correction value="True" />
<ignored_scope>
<types value="['GroupNormalization']" />
</ignored_scope>
<model_type value="transformer" />
<preset value="mixed" />
<subset_size value="300" />
<target_device value="ANY" />
</quantization>
</nncf>
<optimum>
<optimum_intel_version value="1.20.1" />
<optimum_version value="1.24.0" />
<pytorch_version value="2.6.0+cu124" />
<transformers_version value="4.52.0.dev0" />
</optimum>
</rt_info>
</net>