| <?xml version="1.0"?>
|
| <net name="Model1564" version="11">
|
| <layers>
|
| <layer id="1" name="input_ids" type="Parameter" version="opset1">
|
| <data shape="?,?" element_type="i64" />
|
| <output>
|
| <port id="0" precision="I64" names="input_ids">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="0" name="attention_mask" type="Parameter" version="opset1">
|
| <data shape="?,?" element_type="i64" />
|
| <output>
|
| <port id="0" precision="I64" names="attention_mask">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="2" name="Constant_1827270" type="Const" version="opset1">
|
| <data element_type="i8" shape="50265, 768" offset="0" size="38603520" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>50265</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="3" name="Convert_1827271" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>50265</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>50265</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="4" name="Constant_1827272" type="Const" version="opset1">
|
| <data element_type="f32" shape="50265, 1" offset="38603520" size="201060" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>50265</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="5" name="__module.roberta.embeddings.word_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>50265</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>50265</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>50265</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="6" name="__module.roberta.embeddings.word_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
|
| <data destination_type="i32" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="I32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="7" name="__module.roberta.embeddings.word_embeddings/aten::embedding/Constant" type="Const" version="opset1">
|
| <data element_type="i32" shape="" offset="38804580" size="4" />
|
| <output>
|
| <port id="0" precision="I32" />
|
| </output>
|
| </layer>
|
| <layer id="8" name="__module.roberta.embeddings.word_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>50265</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="2" precision="I32" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="54,inputs_embeds">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="9" name="Constant_1827274" type="Const" version="opset1">
|
| <data element_type="i8" shape="1, 768" offset="38804584" size="768" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="10" name="Convert_1827275" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="11" name="Constant_1827276" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1" offset="38805352" size="4" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="12" name="__module.roberta.embeddings.token_type_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="13" name="__module.roberta/aten::slice/Slice" type="Const" version="opset1">
|
| <data element_type="i64" shape="1, 514" offset="38805356" size="4112" />
|
| <output>
|
| <port id="0" precision="I64" names="37">
|
| <dim>1</dim>
|
| <dim>514</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="14" name="__module.roberta/aten::slice/Reshape" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="38809468" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="15" name="__module.roberta/aten::size/ShapeOf_1" type="ShapeOf" version="opset3">
|
| <data output_type="i64" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="I64" names="39">
|
| <dim>2</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="16" name="Constant_1612273" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="38809476" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="17" name="Constant_1612274" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="38809468" size="8" />
|
| <output>
|
| <port id="0" precision="I64" />
|
| </output>
|
| </layer>
|
| <layer id="18" name="Gather_1612275" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>2</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="I64" names="36,67">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="19" name="__module.roberta/aten::slice/Reshape_2" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="38809476" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="20" name="__module.roberta/aten::slice/Reshape_3" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="38809476" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="21" name="__module.roberta/aten::slice/Slice_1" type="Slice" version="opset8">
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| <dim>514</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="2" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="3" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="4" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="5" precision="I64" names="38,buffered_token_type_ids">
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="22" name="__module.roberta/aten::expand/Broadcast" type="Broadcast" version="opset3">
|
| <data mode="bidirectional" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>2</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="I64" names="40">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="23" name="__module.roberta.embeddings.token_type_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
|
| <data destination_type="i32" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="I32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="24" name="__module.roberta.embeddings.token_type_embeddings/aten::embedding/Constant" type="Const" version="opset1">
|
| <data element_type="i32" shape="" offset="38804580" size="4" />
|
| <output>
|
| <port id="0" precision="I32" />
|
| </output>
|
| </layer>
|
| <layer id="25" name="__module.roberta.embeddings.token_type_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="2" precision="I32" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="56,token_type_embeddings.1">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="26" name="__module.roberta.embeddings/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="57_1">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="27" name="Constant_1827278" type="Const" version="opset1">
|
| <data element_type="i8" shape="514, 768" offset="38809484" size="394752" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>514</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="28" name="Convert_1827279" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>514</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>514</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="29" name="Constant_1827280" type="Const" version="opset1">
|
| <data element_type="f32" shape="514, 1" offset="39204236" size="2056" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>514</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="30" name="__module.roberta.embeddings.position_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>514</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>514</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>514</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="31" name="Constant_1612144" type="Const" version="opset1">
|
| <data element_type="i64" shape="1, 1" offset="38809476" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="32" name="__module.roberta.embeddings/aten::ne/NotEqual" type="NotEqual" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="BOOL" names="45">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="33" name="__module.roberta.embeddings/aten::to/Convert" type="Convert" version="opset1">
|
| <data destination_type="i32" />
|
| <input>
|
| <port id="0" precision="BOOL">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="I32" names="46,mask">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="34" name="29" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="38809476" size="8" />
|
| <output>
|
| <port id="0" precision="I64" names="29" />
|
| </output>
|
| </layer>
|
| <layer id="35" name="__module.roberta.embeddings/aten::cumsum/CumSum" type="CumSum" version="opset3">
|
| <data exclusive="false" reverse="false" />
|
| <input>
|
| <port id="0" precision="I32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="2" precision="I32" names="47,48,49">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="36" name="__module.roberta.embeddings/aten::mul/Multiply" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="I32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="I32" names="50,incremental_indices">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="37" name="__module.roberta.embeddings/aten::to/Convert_1" type="Convert" version="opset1">
|
| <data destination_type="i64" />
|
| <input>
|
| <port id="0" precision="I32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="I64" names="51">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="38" name="Constant_1612145" type="Const" version="opset1">
|
| <data element_type="i64" shape="1, 1" offset="38809476" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="39" name="__module.roberta.embeddings/aten::add/Add_2" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="I64" names="52">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="40" name="__module.roberta.embeddings.position_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
|
| <data destination_type="i32" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="I32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="41" name="__module.roberta.embeddings.position_embeddings/aten::embedding/Constant" type="Const" version="opset1">
|
| <data element_type="i32" shape="" offset="38804580" size="4" />
|
| <output>
|
| <port id="0" precision="I32" />
|
| </output>
|
| </layer>
|
| <layer id="42" name="__module.roberta.embeddings.position_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>514</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="2" precision="I32" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="59,position_embeddings.1">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="43" name="__module.roberta.embeddings/aten::add_/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="57,embeddings.1">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="44" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="45" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="46" name="Constant_1612146" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="39206296" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="47" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="48" name="Constant_1612147" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="39209368" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="49" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="64,input.1">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="50" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="39212440" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="51" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="52" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="39215512" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="53" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="39215516" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="54" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="39215512" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="55" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="39215516" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="56" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="57" name="Constant_1827282" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="39215520" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="58" name="Convert_1827283" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="59" name="Constant_1827284" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="39805344" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="60" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="61" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="62" name="Constant_1612148" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="39808416" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="63" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="102,x.1">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="64" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="39811488" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="65" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="39811492" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="66" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="39811488" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="67" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="39811492" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="68" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="69" name="__module.roberta.encoder.layer.0.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="70" name="__module.roberta.encoder.layer.0.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="106,x.3">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="71" name="Constant_1607017" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="107">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="72" name="__module.roberta.encoder.layer.0.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="108">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="73" name="Constant_1827286" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="39811560" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="74" name="Convert_1827287" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="75" name="Constant_1827288" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="40401384" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="76" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="77" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="78" name="Constant_1612149" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="40404456" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="79" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="111,x.5">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="80" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="40407528" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="81" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="40407532" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="82" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="40407528" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="83" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="40407532" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="84" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="85" name="__module.roberta.encoder.layer.0.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="86" name="__module.roberta.encoder.layer.0.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="115,x.7">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="87" name="Constant_1607040" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="116">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="88" name="__module.roberta.encoder.layer.0.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="117">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="89" name="Constant_1827290" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="40407536" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="90" name="Convert_1827291" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="91" name="Constant_1827292" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="40997360" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="92" name="__module.roberta.encoder.layer.0.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="93" name="__module.roberta.encoder.layer.0.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="94" name="Constant_1612150" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="41000432" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="95" name="__module.roberta.encoder.layer.0.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="120,x.9">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="96" name="__module.roberta.encoder.layer.0.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="97" name="__module.roberta.encoder.layer.0.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="124,x.11">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="98" name="Constant_1607063" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="125">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="99" name="__module.roberta.encoder.layer.0.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="126">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="100" name="Constant_1612152" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 1, 1" offset="41003504" size="4" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="101" name="__module.roberta/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1">
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="2" precision="I64" names="69">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="102" name="16" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="41003508" size="8" />
|
| <output>
|
| <port id="0" precision="I64" names="16" />
|
| </output>
|
| </layer>
|
| <layer id="103" name="__module.roberta/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1">
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="2" precision="I64" names="70,71">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="104" name="Constant_1612278" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="38809468" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="105" name="Constant_1612279" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="38809468" size="8" />
|
| <output>
|
| <port id="0" precision="I64" />
|
| </output>
|
| </layer>
|
| <layer id="106" name="Gather_1612280" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>2</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="I64" names="66">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="107" name="Constant_1611426" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="38809476" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="108" name="Constant_1612384" type="Const" version="opset1">
|
| <data element_type="i64" shape="2" offset="41003516" size="16" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>2</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="109" name="Constant_1612385" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="38809468" size="8" />
|
| <output>
|
| <port id="0" precision="I64" />
|
| </output>
|
| </layer>
|
| <layer id="110" name="Gather_1612386" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>2</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>2</dim>
|
| </port>
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="I64">
|
| <dim>2</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="111" name="__module.roberta/prim::ListConstruct/Concat_1" type="Concat" version="opset1">
|
| <data axis="0" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="2" precision="I64">
|
| <dim>2</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="3" precision="I64" names="72">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="112" name="__module.roberta/aten::expand/Broadcast_1" type="Broadcast" version="opset3">
|
| <data mode="bidirectional" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="I64" names="73">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="113" name="__module.roberta/aten::to/Convert" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="74">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="114" name="Constant_1612151" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 1, 1" offset="41003504" size="4" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="115" name="__module.roberta/aten::rsub/Multiply" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="116" name="__module.roberta/aten::rsub/Subtract" type="Subtract" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="75,inverted_mask">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="117" name="__module.roberta/aten::to/Convert_1" type="Convert" version="opset1">
|
| <data destination_type="boolean" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="BOOL" names="76">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="118" name="__module.roberta/aten::masked_fill/ConvertLike" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="41003532" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="119" name="__module.roberta/aten::masked_fill/Select" type="Select" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="BOOL">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="77">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="120" name="__module.roberta.encoder.layer.0.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="4" precision="FP32" names="127,attn_output.1">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="121" name="__module.roberta.encoder.layer.0.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
| <data element_type="i32" shape="4" offset="41003536" size="16" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="122" name="__module.roberta.encoder.layer.0.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="128,attn_output.3">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="123" name="Constant_1612282" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="41003552" size="24" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="124" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="130">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="125" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="41003576" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="126" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="127" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="41006648" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="128" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="41006652" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="129" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="41006648" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="130" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="41006652" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="131" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="132" name="Constant_1827294" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="41006656" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="133" name="Convert_1827295" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="134" name="Constant_1827296" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="41596480" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="135" name="__module.roberta.encoder.layer.0.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="136" name="__module.roberta.encoder.layer.0.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="137" name="Constant_1612153" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="41599552" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="138" name="__module.roberta.encoder.layer.0.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="135,input.3">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="139" name="__module.roberta.encoder.layer.0.attention.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="137">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="140" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="141" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="142" name="Constant_1612154" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="41602624" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="143" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="144" name="Constant_1612155" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="41605696" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="145" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="141,input_tensor.1">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="146" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="41608768" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="147" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="148" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="41611840" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="149" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="41611844" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="150" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="41611840" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="151" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="41611844" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="152" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="153" name="Constant_1827298" type="Const" version="opset1">
|
| <data element_type="i8" shape="3072, 768" offset="41611848" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="154" name="Convert_1827299" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="155" name="Constant_1827300" type="Const" version="opset1">
|
| <data element_type="f32" shape="3072, 1" offset="43971144" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="156" name="__module.roberta.encoder.layer.0.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="157" name="__module.roberta.encoder.layer.0.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="158" name="Constant_1612156" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="43983432" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="159" name="__module.roberta.encoder.layer.0.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="145">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="160" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="146">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="161" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="43995720" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="162" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="163" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="44008008" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="164" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="44008012" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="165" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="44008008" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="166" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="44008012" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="167" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="168" name="Constant_1827302" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 3072" offset="44008016" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="169" name="Convert_1827303" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="170" name="Constant_1827304" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="46367312" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="171" name="__module.roberta.encoder.layer.0.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="172" name="__module.roberta.encoder.layer.0.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="173" name="Constant_1612157" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="46370384" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="174" name="__module.roberta.encoder.layer.0.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="151,input.5">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="175" name="__module.roberta.encoder.layer.0.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="153">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="176" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="177" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="178" name="Constant_1612158" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="46373456" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="179" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="180" name="Constant_1612159" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="46376528" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="181" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="157,hidden_states.7">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="182" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="46379600" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="183" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="184" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="46382672" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="185" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="46382676" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="186" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="46382672" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="187" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="46382676" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="188" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="189" name="Constant_1827306" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="46382680" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="190" name="Convert_1827307" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="191" name="Constant_1827308" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="46972504" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="192" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="193" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="194" name="Constant_1612160" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="46975576" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="195" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="170,x.13">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="196" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="46978648" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="197" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="46978652" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="198" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="46978648" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="199" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="46978652" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="200" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="201" name="__module.roberta.encoder.layer.1.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="202" name="__module.roberta.encoder.layer.1.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="174,x.15">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="203" name="Constant_1607240" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="175">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="204" name="__module.roberta.encoder.layer.1.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="176">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="205" name="Constant_1827310" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="46978656" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="206" name="Convert_1827311" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="207" name="Constant_1827312" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="47568480" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="208" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="209" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="210" name="Constant_1612161" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="47571552" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="211" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="179,x.17">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="212" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="47574624" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="213" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="47574628" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="214" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="47574624" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="215" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="47574628" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="216" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="217" name="__module.roberta.encoder.layer.1.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="218" name="__module.roberta.encoder.layer.1.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="183,x.19">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="219" name="Constant_1607263" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="184">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="220" name="__module.roberta.encoder.layer.1.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="185">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="221" name="Constant_1827314" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="47574632" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="222" name="Convert_1827315" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="223" name="Constant_1827316" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="48164456" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="224" name="__module.roberta.encoder.layer.1.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="225" name="__module.roberta.encoder.layer.1.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="226" name="Constant_1612162" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="48167528" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="227" name="__module.roberta.encoder.layer.1.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="188,x.21">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="228" name="__module.roberta.encoder.layer.1.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="229" name="__module.roberta.encoder.layer.1.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="192,x.23">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="230" name="Constant_1607286" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="193">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="231" name="__module.roberta.encoder.layer.1.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="194">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="232" name="__module.roberta.encoder.layer.1.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="4" precision="FP32" names="195,attn_output.5">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="233" name="__module.roberta.encoder.layer.1.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
| <data element_type="i32" shape="4" offset="41003536" size="16" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="234" name="__module.roberta.encoder.layer.1.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="196,attn_output.7">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="235" name="Constant_1612283" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="41003552" size="24" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="236" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="198">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="237" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="48170600" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="238" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="239" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="48173672" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="240" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="48173676" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="241" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="48173672" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="242" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="48173676" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="243" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="244" name="Constant_1827318" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="48173680" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="245" name="Convert_1827319" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="246" name="Constant_1827320" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="48763504" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="247" name="__module.roberta.encoder.layer.1.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="248" name="__module.roberta.encoder.layer.1.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="249" name="Constant_1612163" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="48766576" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="250" name="__module.roberta.encoder.layer.1.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="203,input.7">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="251" name="__module.roberta.encoder.layer.1.attention.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="205">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="252" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="253" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="254" name="Constant_1612164" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="48769648" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="255" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="256" name="Constant_1612165" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="48772720" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="257" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="209,input_tensor.3">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="258" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="48775792" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="259" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="260" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="48778864" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="261" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="48778868" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="262" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="48778864" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="263" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="48778868" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="264" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="265" name="Constant_1827322" type="Const" version="opset1">
|
| <data element_type="i8" shape="3072, 768" offset="48778872" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="266" name="Convert_1827323" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="267" name="Constant_1827324" type="Const" version="opset1">
|
| <data element_type="f32" shape="3072, 1" offset="51138168" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="268" name="__module.roberta.encoder.layer.1.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="269" name="__module.roberta.encoder.layer.1.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="270" name="Constant_1612166" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="51150456" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="271" name="__module.roberta.encoder.layer.1.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="213">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="272" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="214">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="273" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="51162744" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="274" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="275" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="51175032" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="276" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="51175036" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="277" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="51175032" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="278" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="51175036" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="279" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="280" name="Constant_1827326" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 3072" offset="51175040" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="281" name="Convert_1827327" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="282" name="Constant_1827328" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="53534336" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="283" name="__module.roberta.encoder.layer.1.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="284" name="__module.roberta.encoder.layer.1.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="285" name="Constant_1612167" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="53537408" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="286" name="__module.roberta.encoder.layer.1.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="219,input.9">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="287" name="__module.roberta.encoder.layer.1.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="221">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="288" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="289" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="290" name="Constant_1612168" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="53540480" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="291" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="292" name="Constant_1612169" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="53543552" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="293" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="225,hidden_states.13">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="294" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="53546624" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="295" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="296" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="53549696" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="297" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="53549700" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="298" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="53549696" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="299" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="53549700" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="300" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="301" name="Constant_1827330" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="53549704" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="302" name="Convert_1827331" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="303" name="Constant_1827332" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="54139528" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="304" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="305" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="306" name="Constant_1612170" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="54142600" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="307" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="238,x.25">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="308" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="54145672" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="309" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="54145676" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="310" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="54145672" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="311" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="54145676" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="312" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="313" name="__module.roberta.encoder.layer.2.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="314" name="__module.roberta.encoder.layer.2.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="242,x.27">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="315" name="Constant_1607463" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="243">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="316" name="__module.roberta.encoder.layer.2.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="244">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="317" name="Constant_1827334" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="54145680" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="318" name="Convert_1827335" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="319" name="Constant_1827336" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="54735504" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="320" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="321" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="322" name="Constant_1612171" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="54738576" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="323" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="247,x.29">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="324" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="54741648" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="325" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="54741652" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="326" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="54741648" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="327" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="54741652" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="328" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="329" name="__module.roberta.encoder.layer.2.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="330" name="__module.roberta.encoder.layer.2.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="251,x.31">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="331" name="Constant_1607486" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="252">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="332" name="__module.roberta.encoder.layer.2.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="253">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="333" name="Constant_1827338" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="54741656" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="334" name="Convert_1827339" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="335" name="Constant_1827340" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="55331480" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="336" name="__module.roberta.encoder.layer.2.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="337" name="__module.roberta.encoder.layer.2.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="338" name="Constant_1612172" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="55334552" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="339" name="__module.roberta.encoder.layer.2.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="256,x.33">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="340" name="__module.roberta.encoder.layer.2.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="341" name="__module.roberta.encoder.layer.2.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="260,x.35">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="342" name="Constant_1607509" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="261">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="343" name="__module.roberta.encoder.layer.2.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="262">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="344" name="__module.roberta.encoder.layer.2.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="4" precision="FP32" names="263,attn_output.9">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="345" name="__module.roberta.encoder.layer.2.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
| <data element_type="i32" shape="4" offset="41003536" size="16" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="346" name="__module.roberta.encoder.layer.2.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="264,attn_output.11">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="347" name="Constant_1612284" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="41003552" size="24" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="348" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="266">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="349" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="55337624" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="350" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="351" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="55340696" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="352" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="55340700" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="353" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="55340696" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="354" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="55340700" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="355" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="356" name="Constant_1827342" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="55340704" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="357" name="Convert_1827343" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="358" name="Constant_1827344" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="55930528" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="359" name="__module.roberta.encoder.layer.2.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="360" name="__module.roberta.encoder.layer.2.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="361" name="Constant_1612173" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="55933600" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="362" name="__module.roberta.encoder.layer.2.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="271,input.11">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="363" name="__module.roberta.encoder.layer.2.attention.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="273">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="364" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="365" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="366" name="Constant_1612174" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="55936672" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="367" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="368" name="Constant_1612175" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="55939744" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="369" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="277,input_tensor.5">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="370" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="55942816" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="371" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="372" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="55945888" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="373" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="55945892" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="374" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="55945888" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="375" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="55945892" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="376" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="377" name="Constant_1827346" type="Const" version="opset1">
|
| <data element_type="i8" shape="3072, 768" offset="55945896" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="378" name="Convert_1827347" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="379" name="Constant_1827348" type="Const" version="opset1">
|
| <data element_type="f32" shape="3072, 1" offset="58305192" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="380" name="__module.roberta.encoder.layer.2.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="381" name="__module.roberta.encoder.layer.2.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="382" name="Constant_1612176" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="58317480" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="383" name="__module.roberta.encoder.layer.2.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="281">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="384" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="282">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="385" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="58329768" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="386" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="387" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="58342056" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="388" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="58342060" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="389" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="58342056" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="390" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="58342060" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="391" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="392" name="Constant_1827350" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 3072" offset="58342064" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="393" name="Convert_1827351" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="394" name="Constant_1827352" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="60701360" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="395" name="__module.roberta.encoder.layer.2.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="396" name="__module.roberta.encoder.layer.2.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="397" name="Constant_1612177" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="60704432" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="398" name="__module.roberta.encoder.layer.2.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="287,input.13">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="399" name="__module.roberta.encoder.layer.2.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="289">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="400" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="401" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="402" name="Constant_1612178" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="60707504" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="403" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="404" name="Constant_1612179" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="60710576" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="405" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="293,hidden_states.19">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="406" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="60713648" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="407" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="408" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="60716720" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="409" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="60716724" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="410" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="60716720" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="411" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="60716724" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="412" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="413" name="Constant_1827354" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="60716728" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="414" name="Convert_1827355" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="415" name="Constant_1827356" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="61306552" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="416" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="417" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="418" name="Constant_1612180" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="61309624" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="419" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="306,x.37">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="420" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="61312696" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="421" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="61312700" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="422" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="61312696" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="423" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="61312700" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="424" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="425" name="__module.roberta.encoder.layer.3.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="426" name="__module.roberta.encoder.layer.3.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="310,x.39">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="427" name="Constant_1607686" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="311">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="428" name="__module.roberta.encoder.layer.3.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="312">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="429" name="Constant_1827358" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="61312704" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="430" name="Convert_1827359" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="431" name="Constant_1827360" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="61902528" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="432" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="433" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="434" name="Constant_1612181" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="61905600" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="435" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="315,x.41">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="436" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="61908672" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="437" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="61908676" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="438" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="61908672" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="439" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="61908676" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="440" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="441" name="__module.roberta.encoder.layer.3.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="442" name="__module.roberta.encoder.layer.3.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="319,x.43">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="443" name="Constant_1607709" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="320">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="444" name="__module.roberta.encoder.layer.3.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="321">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="445" name="Constant_1827362" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="61908680" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="446" name="Convert_1827363" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="447" name="Constant_1827364" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="62498504" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="448" name="__module.roberta.encoder.layer.3.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="449" name="__module.roberta.encoder.layer.3.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="450" name="Constant_1612182" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="62501576" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="451" name="__module.roberta.encoder.layer.3.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="324,x.45">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="452" name="__module.roberta.encoder.layer.3.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="453" name="__module.roberta.encoder.layer.3.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="328,x.47">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="454" name="Constant_1607732" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="329">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="455" name="__module.roberta.encoder.layer.3.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="330">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="456" name="__module.roberta.encoder.layer.3.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="4" precision="FP32" names="331,attn_output.13">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="457" name="__module.roberta.encoder.layer.3.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
| <data element_type="i32" shape="4" offset="41003536" size="16" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="458" name="__module.roberta.encoder.layer.3.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="332,attn_output.15">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="459" name="Constant_1612285" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="41003552" size="24" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="460" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="334">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="461" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="62504648" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="462" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="463" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="62507720" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="464" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="62507724" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="465" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="62507720" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="466" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="62507724" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="467" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="468" name="Constant_1827366" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="62507728" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="469" name="Convert_1827367" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="470" name="Constant_1827368" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="63097552" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="471" name="__module.roberta.encoder.layer.3.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="472" name="__module.roberta.encoder.layer.3.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="473" name="Constant_1612183" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="63100624" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="474" name="__module.roberta.encoder.layer.3.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="339,input.15">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="475" name="__module.roberta.encoder.layer.3.attention.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="341">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="476" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="477" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="478" name="Constant_1612184" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="63103696" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="479" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="480" name="Constant_1612185" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="63106768" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="481" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="345,input_tensor.7">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="482" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="63109840" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="483" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="484" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="63112912" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="485" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="63112916" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="486" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="63112912" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="487" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="63112916" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="488" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="489" name="Constant_1827370" type="Const" version="opset1">
|
| <data element_type="i8" shape="3072, 768" offset="63112920" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="490" name="Convert_1827371" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="491" name="Constant_1827372" type="Const" version="opset1">
|
| <data element_type="f32" shape="3072, 1" offset="65472216" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="492" name="__module.roberta.encoder.layer.3.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="493" name="__module.roberta.encoder.layer.3.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="494" name="Constant_1612186" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="65484504" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="495" name="__module.roberta.encoder.layer.3.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="349">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="496" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="350">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="497" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="65496792" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="498" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="499" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="65509080" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="500" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="65509084" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="501" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="65509080" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="502" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="65509084" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="503" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="504" name="Constant_1827374" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 3072" offset="65509088" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="505" name="Convert_1827375" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="506" name="Constant_1827376" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="67868384" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="507" name="__module.roberta.encoder.layer.3.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="508" name="__module.roberta.encoder.layer.3.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="509" name="Constant_1612187" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="67871456" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="510" name="__module.roberta.encoder.layer.3.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="355,input.17">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="511" name="__module.roberta.encoder.layer.3.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="357">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="512" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="513" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="514" name="Constant_1612188" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="67874528" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="515" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="516" name="Constant_1612189" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="67877600" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="517" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="361,hidden_states.25">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="518" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="67880672" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="519" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="520" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="67883744" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="521" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="67883748" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="522" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="67883744" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="523" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="67883748" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="524" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="525" name="Constant_1827378" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="67883752" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="526" name="Convert_1827379" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="527" name="Constant_1827380" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="68473576" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="528" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="529" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="530" name="Constant_1612190" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="68476648" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="531" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="374,x.49">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="532" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="68479720" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="533" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="68479724" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="534" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="68479720" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="535" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="68479724" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="536" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="537" name="__module.roberta.encoder.layer.4.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="538" name="__module.roberta.encoder.layer.4.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="378,x.51">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="539" name="Constant_1607909" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="379">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="540" name="__module.roberta.encoder.layer.4.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="380">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="541" name="Constant_1827382" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="68479728" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="542" name="Convert_1827383" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="543" name="Constant_1827384" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="69069552" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="544" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="545" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="546" name="Constant_1612191" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="69072624" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="547" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="383,x.53">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="548" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="69075696" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="549" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="69075700" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="550" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="69075696" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="551" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="69075700" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="552" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="553" name="__module.roberta.encoder.layer.4.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="554" name="__module.roberta.encoder.layer.4.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="387,x.55">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="555" name="Constant_1607932" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="388">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="556" name="__module.roberta.encoder.layer.4.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="389">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="557" name="Constant_1827386" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="69075704" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="558" name="Convert_1827387" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="559" name="Constant_1827388" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="69665528" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="560" name="__module.roberta.encoder.layer.4.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="561" name="__module.roberta.encoder.layer.4.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="562" name="Constant_1612192" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="69668600" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="563" name="__module.roberta.encoder.layer.4.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="392,x.57">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="564" name="__module.roberta.encoder.layer.4.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="565" name="__module.roberta.encoder.layer.4.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="396,x.59">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="566" name="Constant_1607955" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="397">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="567" name="__module.roberta.encoder.layer.4.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="398">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="568" name="__module.roberta.encoder.layer.4.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="4" precision="FP32" names="399,attn_output.17">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="569" name="__module.roberta.encoder.layer.4.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
| <data element_type="i32" shape="4" offset="41003536" size="16" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="570" name="__module.roberta.encoder.layer.4.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="400,attn_output.19">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="571" name="Constant_1612286" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="41003552" size="24" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="572" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="402">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="573" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="69671672" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="574" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="575" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="69674744" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="576" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="69674748" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="577" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="69674744" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="578" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="69674748" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="579" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="580" name="Constant_1827390" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="69674752" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="581" name="Convert_1827391" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="582" name="Constant_1827392" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="70264576" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="583" name="__module.roberta.encoder.layer.4.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="584" name="__module.roberta.encoder.layer.4.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="585" name="Constant_1612193" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="70267648" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="586" name="__module.roberta.encoder.layer.4.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="407,input.19">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="587" name="__module.roberta.encoder.layer.4.attention.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="409">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="588" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="589" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="590" name="Constant_1612194" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="70270720" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="591" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="592" name="Constant_1612195" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="70273792" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="593" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="413,input_tensor.9">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="594" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="70276864" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="595" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="596" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="70279936" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="597" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="70279940" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="598" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="70279936" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="599" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="70279940" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="600" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="601" name="Constant_1827394" type="Const" version="opset1">
|
| <data element_type="i8" shape="3072, 768" offset="70279944" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="602" name="Convert_1827395" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="603" name="Constant_1827396" type="Const" version="opset1">
|
| <data element_type="f32" shape="3072, 1" offset="72639240" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="604" name="__module.roberta.encoder.layer.4.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="605" name="__module.roberta.encoder.layer.4.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="606" name="Constant_1612196" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="72651528" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="607" name="__module.roberta.encoder.layer.4.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="417">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="608" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="418">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="609" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="72663816" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="610" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="611" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="72676104" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="612" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="72676108" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="613" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="72676104" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="614" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="72676108" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="615" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="616" name="Constant_1827398" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 3072" offset="72676112" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="617" name="Convert_1827399" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="618" name="Constant_1827400" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="75035408" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="619" name="__module.roberta.encoder.layer.4.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="620" name="__module.roberta.encoder.layer.4.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="621" name="Constant_1612197" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="75038480" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="622" name="__module.roberta.encoder.layer.4.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="423,input.21">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="623" name="__module.roberta.encoder.layer.4.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="425">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="624" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="625" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="626" name="Constant_1612198" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="75041552" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="627" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="628" name="Constant_1612199" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="75044624" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="629" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="429,hidden_states.31">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="630" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="75047696" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="631" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="632" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="75050768" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="633" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="75050772" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="634" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="75050768" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="635" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="75050772" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="636" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="637" name="Constant_1827402" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="75050776" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="638" name="Convert_1827403" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="639" name="Constant_1827404" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="75640600" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="640" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="641" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="642" name="Constant_1612200" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="75643672" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="643" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="442,x.61">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="644" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="75646744" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="645" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="75646748" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="646" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="75646744" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="647" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="75646748" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="648" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="649" name="__module.roberta.encoder.layer.5.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="650" name="__module.roberta.encoder.layer.5.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="446,x.63">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="651" name="Constant_1608132" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="447">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="652" name="__module.roberta.encoder.layer.5.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="448">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="653" name="Constant_1827406" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="75646752" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="654" name="Convert_1827407" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="655" name="Constant_1827408" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="76236576" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="656" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="657" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="658" name="Constant_1612201" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="76239648" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="659" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="451,x.65">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="660" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="76242720" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="661" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="76242724" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="662" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="76242720" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="663" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="76242724" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="664" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="665" name="__module.roberta.encoder.layer.5.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="666" name="__module.roberta.encoder.layer.5.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="455,x.67">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="667" name="Constant_1608155" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="456">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="668" name="__module.roberta.encoder.layer.5.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="457">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="669" name="Constant_1827410" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="76242728" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="670" name="Convert_1827411" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="671" name="Constant_1827412" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="76832552" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="672" name="__module.roberta.encoder.layer.5.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="673" name="__module.roberta.encoder.layer.5.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="674" name="Constant_1612202" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="76835624" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="675" name="__module.roberta.encoder.layer.5.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="460,x.69">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="676" name="__module.roberta.encoder.layer.5.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811496" size="32" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="677" name="__module.roberta.encoder.layer.5.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="464,x">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="678" name="Constant_1608178" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="39811528" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="465">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="679" name="__module.roberta.encoder.layer.5.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="466">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="680" name="__module.roberta.encoder.layer.5.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="4" precision="FP32" names="467,attn_output.21">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="681" name="__module.roberta.encoder.layer.5.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
| <data element_type="i32" shape="4" offset="41003536" size="16" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="682" name="__module.roberta.encoder.layer.5.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="468,attn_output">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="683" name="Constant_1612287" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="41003552" size="24" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="684" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="470">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="685" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="76838696" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="686" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="687" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="76841768" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="688" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="76841772" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="689" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="76841768" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="690" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="76841772" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="691" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="692" name="Constant_1827414" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="76841776" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="693" name="Convert_1827415" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="694" name="Constant_1827416" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="77431600" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="695" name="__module.roberta.encoder.layer.5.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="696" name="__module.roberta.encoder.layer.5.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="697" name="Constant_1612203" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="77434672" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="698" name="__module.roberta.encoder.layer.5.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="475,input.23">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="699" name="__module.roberta.encoder.layer.5.attention.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="477">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="700" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="701" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="702" name="Constant_1612204" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="77437744" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="703" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="704" name="Constant_1612205" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="77440816" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="705" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="481,input_tensor">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="706" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="77443888" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="707" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="708" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="77446960" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="709" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="77446964" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="710" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="77446960" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="711" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="77446964" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="712" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="713" name="Constant_1827418" type="Const" version="opset1">
|
| <data element_type="i8" shape="3072, 768" offset="77446968" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="714" name="Convert_1827419" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="715" name="Constant_1827420" type="Const" version="opset1">
|
| <data element_type="f32" shape="3072, 1" offset="79806264" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="716" name="__module.roberta.encoder.layer.5.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="717" name="__module.roberta.encoder.layer.5.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="718" name="Constant_1612206" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="79818552" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="719" name="__module.roberta.encoder.layer.5.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="485">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="720" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="486">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="721" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 3072" offset="79830840" size="12288" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="722" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="723" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="79843128" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="724" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="79843132" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="725" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="79843128" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="726" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="79843132" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="727" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="728" name="Constant_1827422" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 3072" offset="79843136" size="2359296" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="729" name="Convert_1827423" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="730" name="Constant_1827424" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="82202432" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="731" name="__module.roberta.encoder.layer.5.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="732" name="__module.roberta.encoder.layer.5.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="733" name="Constant_1612207" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="82205504" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="734" name="__module.roberta.encoder.layer.5.output.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="491,input.25">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="735" name="__module.roberta.encoder.layer.5.output/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="493">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="736" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="39206292" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="737" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="738" name="Constant_1612208" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="82208576" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="739" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="740" name="Constant_1612209" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1, 768" offset="82211648" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="741" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="497,506,features">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="742" name="502" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="38809468" size="8" />
|
| <output>
|
| <port id="0" precision="I64" names="502" />
|
| </output>
|
| </layer>
|
| <layer id="743" name="500" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="38809476" size="8" />
|
| <output>
|
| <port id="0" precision="I64" names="500" />
|
| </output>
|
| </layer>
|
| <layer id="744" name="__module.classifier/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="507,508,input.27">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="745" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 768" offset="82214720" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="746" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="747" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="82217792" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="748" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="82217796" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="749" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="82217792" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="750" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="82217796" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="751" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="752" name="Constant_1827426" type="Const" version="opset1">
|
| <data element_type="i8" shape="768, 768" offset="82217800" size="589824" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="753" name="Convert_1827427" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="754" name="Constant_1827428" type="Const" version="opset1">
|
| <data element_type="f32" shape="768, 1" offset="82807624" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="755" name="__module.classifier.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="756" name="__module.classifier.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="757" name="Constant_1612210" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 768" offset="82810696" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="758" name="__module.classifier.dense/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="512">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="759" name="__module.classifier/aten::tanh/Tanh" type="Tanh" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="513,input">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="760" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 768" offset="82813768" size="3072" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="761" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="762" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="82816840" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="763" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="82816844" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="764" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="82816840" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="765" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
| <data element_type="f32" shape="" offset="82816844" size="4" />
|
| <output>
|
| <port id="0" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="766" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
| <data levels="256" auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32" />
|
| <port id="2" precision="FP32" />
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="767" name="Constant_1827430" type="Const" version="opset1">
|
| <data element_type="i8" shape="1, 768" offset="82816848" size="768" />
|
| <output>
|
| <port id="0" precision="I8">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="768" name="Convert_1827431" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <input>
|
| <port id="0" precision="I8">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="769" name="Constant_1827432" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1" offset="82817616" size="4" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="770" name="__module.classifier.out_proj/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="771" name="__module.classifier.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="772" name="Constant_1612211" type="Const" version="opset1">
|
| <data element_type="f32" shape="1, 1" offset="82817620" size="4" />
|
| <output>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="773" name="__module.classifier.out_proj/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="logits">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="774" name="Result_1609187" type="Result" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| </layer>
|
| </layers>
|
| <edges>
|
| <edge from-layer="0" from-port="0" to-layer="101" to-port="0" />
|
| <edge from-layer="1" from-port="0" to-layer="6" to-port="0" />
|
| <edge from-layer="1" from-port="0" to-layer="15" to-port="0" />
|
| <edge from-layer="1" from-port="0" to-layer="32" to-port="0" />
|
| <edge from-layer="2" from-port="0" to-layer="3" to-port="0" />
|
| <edge from-layer="3" from-port="1" to-layer="5" to-port="0" />
|
| <edge from-layer="4" from-port="0" to-layer="5" to-port="1" />
|
| <edge from-layer="5" from-port="2" to-layer="8" to-port="0" />
|
| <edge from-layer="6" from-port="1" to-layer="8" to-port="1" />
|
| <edge from-layer="7" from-port="0" to-layer="8" to-port="2" />
|
| <edge from-layer="8" from-port="3" to-layer="26" to-port="0" />
|
| <edge from-layer="9" from-port="0" to-layer="10" to-port="0" />
|
| <edge from-layer="10" from-port="1" to-layer="12" to-port="0" />
|
| <edge from-layer="11" from-port="0" to-layer="12" to-port="1" />
|
| <edge from-layer="12" from-port="2" to-layer="25" to-port="0" />
|
| <edge from-layer="13" from-port="0" to-layer="21" to-port="0" />
|
| <edge from-layer="14" from-port="0" to-layer="21" to-port="1" />
|
| <edge from-layer="15" from-port="1" to-layer="18" to-port="0" />
|
| <edge from-layer="15" from-port="1" to-layer="22" to-port="1" />
|
| <edge from-layer="15" from-port="1" to-layer="110" to-port="0" />
|
| <edge from-layer="15" from-port="1" to-layer="106" to-port="0" />
|
| <edge from-layer="16" from-port="0" to-layer="18" to-port="1" />
|
| <edge from-layer="17" from-port="0" to-layer="18" to-port="2" />
|
| <edge from-layer="18" from-port="3" to-layer="21" to-port="2" />
|
| <edge from-layer="19" from-port="0" to-layer="21" to-port="3" />
|
| <edge from-layer="20" from-port="0" to-layer="21" to-port="4" />
|
| <edge from-layer="21" from-port="5" to-layer="22" to-port="0" />
|
| <edge from-layer="22" from-port="2" to-layer="23" to-port="0" />
|
| <edge from-layer="23" from-port="1" to-layer="25" to-port="1" />
|
| <edge from-layer="24" from-port="0" to-layer="25" to-port="2" />
|
| <edge from-layer="25" from-port="3" to-layer="26" to-port="1" />
|
| <edge from-layer="26" from-port="2" to-layer="43" to-port="0" />
|
| <edge from-layer="27" from-port="0" to-layer="28" to-port="0" />
|
| <edge from-layer="28" from-port="1" to-layer="30" to-port="0" />
|
| <edge from-layer="29" from-port="0" to-layer="30" to-port="1" />
|
| <edge from-layer="30" from-port="2" to-layer="42" to-port="0" />
|
| <edge from-layer="31" from-port="0" to-layer="32" to-port="1" />
|
| <edge from-layer="32" from-port="2" to-layer="33" to-port="0" />
|
| <edge from-layer="33" from-port="1" to-layer="35" to-port="0" />
|
| <edge from-layer="33" from-port="1" to-layer="36" to-port="1" />
|
| <edge from-layer="34" from-port="0" to-layer="35" to-port="1" />
|
| <edge from-layer="34" from-port="0" to-layer="101" to-port="1" />
|
| <edge from-layer="35" from-port="2" to-layer="36" to-port="0" />
|
| <edge from-layer="36" from-port="2" to-layer="37" to-port="0" />
|
| <edge from-layer="37" from-port="1" to-layer="39" to-port="0" />
|
| <edge from-layer="38" from-port="0" to-layer="39" to-port="1" />
|
| <edge from-layer="39" from-port="2" to-layer="40" to-port="0" />
|
| <edge from-layer="40" from-port="1" to-layer="42" to-port="1" />
|
| <edge from-layer="41" from-port="0" to-layer="42" to-port="2" />
|
| <edge from-layer="42" from-port="3" to-layer="43" to-port="1" />
|
| <edge from-layer="43" from-port="2" to-layer="45" to-port="0" />
|
| <edge from-layer="44" from-port="0" to-layer="45" to-port="1" />
|
| <edge from-layer="45" from-port="2" to-layer="47" to-port="0" />
|
| <edge from-layer="46" from-port="0" to-layer="47" to-port="1" />
|
| <edge from-layer="47" from-port="2" to-layer="49" to-port="0" />
|
| <edge from-layer="48" from-port="0" to-layer="49" to-port="1" />
|
| <edge from-layer="49" from-port="2" to-layer="51" to-port="0" />
|
| <edge from-layer="49" from-port="2" to-layer="139" to-port="1" />
|
| <edge from-layer="50" from-port="0" to-layer="51" to-port="1" />
|
| <edge from-layer="51" from-port="2" to-layer="56" to-port="0" />
|
| <edge from-layer="52" from-port="0" to-layer="56" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="56" to-port="2" />
|
| <edge from-layer="54" from-port="0" to-layer="56" to-port="3" />
|
| <edge from-layer="55" from-port="0" to-layer="56" to-port="4" />
|
| <edge from-layer="56" from-port="5" to-layer="61" to-port="0" />
|
| <edge from-layer="56" from-port="5" to-layer="77" to-port="0" />
|
| <edge from-layer="56" from-port="5" to-layer="93" to-port="0" />
|
| <edge from-layer="57" from-port="0" to-layer="58" to-port="0" />
|
| <edge from-layer="58" from-port="1" to-layer="60" to-port="0" />
|
| <edge from-layer="59" from-port="0" to-layer="60" to-port="1" />
|
| <edge from-layer="60" from-port="2" to-layer="61" to-port="1" />
|
| <edge from-layer="61" from-port="2" to-layer="63" to-port="0" />
|
| <edge from-layer="62" from-port="0" to-layer="63" to-port="1" />
|
| <edge from-layer="63" from-port="2" to-layer="68" to-port="0" />
|
| <edge from-layer="64" from-port="0" to-layer="68" to-port="1" />
|
| <edge from-layer="65" from-port="0" to-layer="68" to-port="2" />
|
| <edge from-layer="66" from-port="0" to-layer="68" to-port="3" />
|
| <edge from-layer="67" from-port="0" to-layer="68" to-port="4" />
|
| <edge from-layer="68" from-port="5" to-layer="70" to-port="0" />
|
| <edge from-layer="69" from-port="0" to-layer="70" to-port="1" />
|
| <edge from-layer="70" from-port="2" to-layer="72" to-port="0" />
|
| <edge from-layer="71" from-port="0" to-layer="72" to-port="1" />
|
| <edge from-layer="72" from-port="2" to-layer="120" to-port="0" />
|
| <edge from-layer="73" from-port="0" to-layer="74" to-port="0" />
|
| <edge from-layer="74" from-port="1" to-layer="76" to-port="0" />
|
| <edge from-layer="75" from-port="0" to-layer="76" to-port="1" />
|
| <edge from-layer="76" from-port="2" to-layer="77" to-port="1" />
|
| <edge from-layer="77" from-port="2" to-layer="79" to-port="0" />
|
| <edge from-layer="78" from-port="0" to-layer="79" to-port="1" />
|
| <edge from-layer="79" from-port="2" to-layer="84" to-port="0" />
|
| <edge from-layer="80" from-port="0" to-layer="84" to-port="1" />
|
| <edge from-layer="81" from-port="0" to-layer="84" to-port="2" />
|
| <edge from-layer="82" from-port="0" to-layer="84" to-port="3" />
|
| <edge from-layer="83" from-port="0" to-layer="84" to-port="4" />
|
| <edge from-layer="84" from-port="5" to-layer="86" to-port="0" />
|
| <edge from-layer="85" from-port="0" to-layer="86" to-port="1" />
|
| <edge from-layer="86" from-port="2" to-layer="88" to-port="0" />
|
| <edge from-layer="87" from-port="0" to-layer="88" to-port="1" />
|
| <edge from-layer="88" from-port="2" to-layer="120" to-port="1" />
|
| <edge from-layer="89" from-port="0" to-layer="90" to-port="0" />
|
| <edge from-layer="90" from-port="1" to-layer="92" to-port="0" />
|
| <edge from-layer="91" from-port="0" to-layer="92" to-port="1" />
|
| <edge from-layer="92" from-port="2" to-layer="93" to-port="1" />
|
| <edge from-layer="93" from-port="2" to-layer="95" to-port="0" />
|
| <edge from-layer="94" from-port="0" to-layer="95" to-port="1" />
|
| <edge from-layer="95" from-port="2" to-layer="97" to-port="0" />
|
| <edge from-layer="96" from-port="0" to-layer="97" to-port="1" />
|
| <edge from-layer="97" from-port="2" to-layer="99" to-port="0" />
|
| <edge from-layer="98" from-port="0" to-layer="99" to-port="1" />
|
| <edge from-layer="99" from-port="2" to-layer="120" to-port="2" />
|
| <edge from-layer="100" from-port="0" to-layer="116" to-port="0" />
|
| <edge from-layer="101" from-port="2" to-layer="103" to-port="0" />
|
| <edge from-layer="102" from-port="0" to-layer="103" to-port="1" />
|
| <edge from-layer="103" from-port="2" to-layer="112" to-port="0" />
|
| <edge from-layer="104" from-port="0" to-layer="106" to-port="1" />
|
| <edge from-layer="105" from-port="0" to-layer="106" to-port="2" />
|
| <edge from-layer="106" from-port="3" to-layer="111" to-port="0" />
|
| <edge from-layer="107" from-port="0" to-layer="111" to-port="1" />
|
| <edge from-layer="108" from-port="0" to-layer="110" to-port="1" />
|
| <edge from-layer="109" from-port="0" to-layer="110" to-port="2" />
|
| <edge from-layer="110" from-port="3" to-layer="111" to-port="2" />
|
| <edge from-layer="111" from-port="3" to-layer="112" to-port="1" />
|
| <edge from-layer="112" from-port="2" to-layer="113" to-port="0" />
|
| <edge from-layer="113" from-port="1" to-layer="115" to-port="0" />
|
| <edge from-layer="114" from-port="0" to-layer="115" to-port="1" />
|
| <edge from-layer="115" from-port="2" to-layer="116" to-port="1" />
|
| <edge from-layer="116" from-port="2" to-layer="117" to-port="0" />
|
| <edge from-layer="116" from-port="2" to-layer="119" to-port="2" />
|
| <edge from-layer="117" from-port="1" to-layer="119" to-port="0" />
|
| <edge from-layer="118" from-port="0" to-layer="119" to-port="1" />
|
| <edge from-layer="119" from-port="3" to-layer="120" to-port="3" />
|
| <edge from-layer="119" from-port="3" to-layer="456" to-port="3" />
|
| <edge from-layer="119" from-port="3" to-layer="568" to-port="3" />
|
| <edge from-layer="119" from-port="3" to-layer="232" to-port="3" />
|
| <edge from-layer="119" from-port="3" to-layer="680" to-port="3" />
|
| <edge from-layer="119" from-port="3" to-layer="344" to-port="3" />
|
| <edge from-layer="120" from-port="4" to-layer="122" to-port="0" />
|
| <edge from-layer="121" from-port="0" to-layer="122" to-port="1" />
|
| <edge from-layer="122" from-port="2" to-layer="124" to-port="0" />
|
| <edge from-layer="123" from-port="0" to-layer="124" to-port="1" />
|
| <edge from-layer="124" from-port="2" to-layer="126" to-port="0" />
|
| <edge from-layer="125" from-port="0" to-layer="126" to-port="1" />
|
| <edge from-layer="126" from-port="2" to-layer="131" to-port="0" />
|
| <edge from-layer="127" from-port="0" to-layer="131" to-port="1" />
|
| <edge from-layer="128" from-port="0" to-layer="131" to-port="2" />
|
| <edge from-layer="129" from-port="0" to-layer="131" to-port="3" />
|
| <edge from-layer="130" from-port="0" to-layer="131" to-port="4" />
|
| <edge from-layer="131" from-port="5" to-layer="136" to-port="0" />
|
| <edge from-layer="132" from-port="0" to-layer="133" to-port="0" />
|
| <edge from-layer="133" from-port="1" to-layer="135" to-port="0" />
|
| <edge from-layer="134" from-port="0" to-layer="135" to-port="1" />
|
| <edge from-layer="135" from-port="2" to-layer="136" to-port="1" />
|
| <edge from-layer="136" from-port="2" to-layer="138" to-port="0" />
|
| <edge from-layer="137" from-port="0" to-layer="138" to-port="1" />
|
| <edge from-layer="138" from-port="2" to-layer="139" to-port="0" />
|
| <edge from-layer="139" from-port="2" to-layer="141" to-port="0" />
|
| <edge from-layer="140" from-port="0" to-layer="141" to-port="1" />
|
| <edge from-layer="141" from-port="2" to-layer="143" to-port="0" />
|
| <edge from-layer="142" from-port="0" to-layer="143" to-port="1" />
|
| <edge from-layer="143" from-port="2" to-layer="145" to-port="0" />
|
| <edge from-layer="144" from-port="0" to-layer="145" to-port="1" />
|
| <edge from-layer="145" from-port="2" to-layer="147" to-port="0" />
|
| <edge from-layer="145" from-port="2" to-layer="175" to-port="1" />
|
| <edge from-layer="146" from-port="0" to-layer="147" to-port="1" />
|
| <edge from-layer="147" from-port="2" to-layer="152" to-port="0" />
|
| <edge from-layer="148" from-port="0" to-layer="152" to-port="1" />
|
| <edge from-layer="149" from-port="0" to-layer="152" to-port="2" />
|
| <edge from-layer="150" from-port="0" to-layer="152" to-port="3" />
|
| <edge from-layer="151" from-port="0" to-layer="152" to-port="4" />
|
| <edge from-layer="152" from-port="5" to-layer="157" to-port="0" />
|
| <edge from-layer="153" from-port="0" to-layer="154" to-port="0" />
|
| <edge from-layer="154" from-port="1" to-layer="156" to-port="0" />
|
| <edge from-layer="155" from-port="0" to-layer="156" to-port="1" />
|
| <edge from-layer="156" from-port="2" to-layer="157" to-port="1" />
|
| <edge from-layer="157" from-port="2" to-layer="159" to-port="0" />
|
| <edge from-layer="158" from-port="0" to-layer="159" to-port="1" />
|
| <edge from-layer="159" from-port="2" to-layer="160" to-port="0" />
|
| <edge from-layer="160" from-port="1" to-layer="162" to-port="0" />
|
| <edge from-layer="161" from-port="0" to-layer="162" to-port="1" />
|
| <edge from-layer="162" from-port="2" to-layer="167" to-port="0" />
|
| <edge from-layer="163" from-port="0" to-layer="167" to-port="1" />
|
| <edge from-layer="164" from-port="0" to-layer="167" to-port="2" />
|
| <edge from-layer="165" from-port="0" to-layer="167" to-port="3" />
|
| <edge from-layer="166" from-port="0" to-layer="167" to-port="4" />
|
| <edge from-layer="167" from-port="5" to-layer="172" to-port="0" />
|
| <edge from-layer="168" from-port="0" to-layer="169" to-port="0" />
|
| <edge from-layer="169" from-port="1" to-layer="171" to-port="0" />
|
| <edge from-layer="170" from-port="0" to-layer="171" to-port="1" />
|
| <edge from-layer="171" from-port="2" to-layer="172" to-port="1" />
|
| <edge from-layer="172" from-port="2" to-layer="174" to-port="0" />
|
| <edge from-layer="173" from-port="0" to-layer="174" to-port="1" />
|
| <edge from-layer="174" from-port="2" to-layer="175" to-port="0" />
|
| <edge from-layer="175" from-port="2" to-layer="177" to-port="0" />
|
| <edge from-layer="176" from-port="0" to-layer="177" to-port="1" />
|
| <edge from-layer="177" from-port="2" to-layer="179" to-port="0" />
|
| <edge from-layer="178" from-port="0" to-layer="179" to-port="1" />
|
| <edge from-layer="179" from-port="2" to-layer="181" to-port="0" />
|
| <edge from-layer="180" from-port="0" to-layer="181" to-port="1" />
|
| <edge from-layer="181" from-port="2" to-layer="183" to-port="0" />
|
| <edge from-layer="181" from-port="2" to-layer="251" to-port="1" />
|
| <edge from-layer="182" from-port="0" to-layer="183" to-port="1" />
|
| <edge from-layer="183" from-port="2" to-layer="188" to-port="0" />
|
| <edge from-layer="184" from-port="0" to-layer="188" to-port="1" />
|
| <edge from-layer="185" from-port="0" to-layer="188" to-port="2" />
|
| <edge from-layer="186" from-port="0" to-layer="188" to-port="3" />
|
| <edge from-layer="187" from-port="0" to-layer="188" to-port="4" />
|
| <edge from-layer="188" from-port="5" to-layer="193" to-port="0" />
|
| <edge from-layer="188" from-port="5" to-layer="225" to-port="0" />
|
| <edge from-layer="188" from-port="5" to-layer="209" to-port="0" />
|
| <edge from-layer="189" from-port="0" to-layer="190" to-port="0" />
|
| <edge from-layer="190" from-port="1" to-layer="192" to-port="0" />
|
| <edge from-layer="191" from-port="0" to-layer="192" to-port="1" />
|
| <edge from-layer="192" from-port="2" to-layer="193" to-port="1" />
|
| <edge from-layer="193" from-port="2" to-layer="195" to-port="0" />
|
| <edge from-layer="194" from-port="0" to-layer="195" to-port="1" />
|
| <edge from-layer="195" from-port="2" to-layer="200" to-port="0" />
|
| <edge from-layer="196" from-port="0" to-layer="200" to-port="1" />
|
| <edge from-layer="197" from-port="0" to-layer="200" to-port="2" />
|
| <edge from-layer="198" from-port="0" to-layer="200" to-port="3" />
|
| <edge from-layer="199" from-port="0" to-layer="200" to-port="4" />
|
| <edge from-layer="200" from-port="5" to-layer="202" to-port="0" />
|
| <edge from-layer="201" from-port="0" to-layer="202" to-port="1" />
|
| <edge from-layer="202" from-port="2" to-layer="204" to-port="0" />
|
| <edge from-layer="203" from-port="0" to-layer="204" to-port="1" />
|
| <edge from-layer="204" from-port="2" to-layer="232" to-port="0" />
|
| <edge from-layer="205" from-port="0" to-layer="206" to-port="0" />
|
| <edge from-layer="206" from-port="1" to-layer="208" to-port="0" />
|
| <edge from-layer="207" from-port="0" to-layer="208" to-port="1" />
|
| <edge from-layer="208" from-port="2" to-layer="209" to-port="1" />
|
| <edge from-layer="209" from-port="2" to-layer="211" to-port="0" />
|
| <edge from-layer="210" from-port="0" to-layer="211" to-port="1" />
|
| <edge from-layer="211" from-port="2" to-layer="216" to-port="0" />
|
| <edge from-layer="212" from-port="0" to-layer="216" to-port="1" />
|
| <edge from-layer="213" from-port="0" to-layer="216" to-port="2" />
|
| <edge from-layer="214" from-port="0" to-layer="216" to-port="3" />
|
| <edge from-layer="215" from-port="0" to-layer="216" to-port="4" />
|
| <edge from-layer="216" from-port="5" to-layer="218" to-port="0" />
|
| <edge from-layer="217" from-port="0" to-layer="218" to-port="1" />
|
| <edge from-layer="218" from-port="2" to-layer="220" to-port="0" />
|
| <edge from-layer="219" from-port="0" to-layer="220" to-port="1" />
|
| <edge from-layer="220" from-port="2" to-layer="232" to-port="1" />
|
| <edge from-layer="221" from-port="0" to-layer="222" to-port="0" />
|
| <edge from-layer="222" from-port="1" to-layer="224" to-port="0" />
|
| <edge from-layer="223" from-port="0" to-layer="224" to-port="1" />
|
| <edge from-layer="224" from-port="2" to-layer="225" to-port="1" />
|
| <edge from-layer="225" from-port="2" to-layer="227" to-port="0" />
|
| <edge from-layer="226" from-port="0" to-layer="227" to-port="1" />
|
| <edge from-layer="227" from-port="2" to-layer="229" to-port="0" />
|
| <edge from-layer="228" from-port="0" to-layer="229" to-port="1" />
|
| <edge from-layer="229" from-port="2" to-layer="231" to-port="0" />
|
| <edge from-layer="230" from-port="0" to-layer="231" to-port="1" />
|
| <edge from-layer="231" from-port="2" to-layer="232" to-port="2" />
|
| <edge from-layer="232" from-port="4" to-layer="234" to-port="0" />
|
| <edge from-layer="233" from-port="0" to-layer="234" to-port="1" />
|
| <edge from-layer="234" from-port="2" to-layer="236" to-port="0" />
|
| <edge from-layer="235" from-port="0" to-layer="236" to-port="1" />
|
| <edge from-layer="236" from-port="2" to-layer="238" to-port="0" />
|
| <edge from-layer="237" from-port="0" to-layer="238" to-port="1" />
|
| <edge from-layer="238" from-port="2" to-layer="243" to-port="0" />
|
| <edge from-layer="239" from-port="0" to-layer="243" to-port="1" />
|
| <edge from-layer="240" from-port="0" to-layer="243" to-port="2" />
|
| <edge from-layer="241" from-port="0" to-layer="243" to-port="3" />
|
| <edge from-layer="242" from-port="0" to-layer="243" to-port="4" />
|
| <edge from-layer="243" from-port="5" to-layer="248" to-port="0" />
|
| <edge from-layer="244" from-port="0" to-layer="245" to-port="0" />
|
| <edge from-layer="245" from-port="1" to-layer="247" to-port="0" />
|
| <edge from-layer="246" from-port="0" to-layer="247" to-port="1" />
|
| <edge from-layer="247" from-port="2" to-layer="248" to-port="1" />
|
| <edge from-layer="248" from-port="2" to-layer="250" to-port="0" />
|
| <edge from-layer="249" from-port="0" to-layer="250" to-port="1" />
|
| <edge from-layer="250" from-port="2" to-layer="251" to-port="0" />
|
| <edge from-layer="251" from-port="2" to-layer="253" to-port="0" />
|
| <edge from-layer="252" from-port="0" to-layer="253" to-port="1" />
|
| <edge from-layer="253" from-port="2" to-layer="255" to-port="0" />
|
| <edge from-layer="254" from-port="0" to-layer="255" to-port="1" />
|
| <edge from-layer="255" from-port="2" to-layer="257" to-port="0" />
|
| <edge from-layer="256" from-port="0" to-layer="257" to-port="1" />
|
| <edge from-layer="257" from-port="2" to-layer="259" to-port="0" />
|
| <edge from-layer="257" from-port="2" to-layer="287" to-port="1" />
|
| <edge from-layer="258" from-port="0" to-layer="259" to-port="1" />
|
| <edge from-layer="259" from-port="2" to-layer="264" to-port="0" />
|
| <edge from-layer="260" from-port="0" to-layer="264" to-port="1" />
|
| <edge from-layer="261" from-port="0" to-layer="264" to-port="2" />
|
| <edge from-layer="262" from-port="0" to-layer="264" to-port="3" />
|
| <edge from-layer="263" from-port="0" to-layer="264" to-port="4" />
|
| <edge from-layer="264" from-port="5" to-layer="269" to-port="0" />
|
| <edge from-layer="265" from-port="0" to-layer="266" to-port="0" />
|
| <edge from-layer="266" from-port="1" to-layer="268" to-port="0" />
|
| <edge from-layer="267" from-port="0" to-layer="268" to-port="1" />
|
| <edge from-layer="268" from-port="2" to-layer="269" to-port="1" />
|
| <edge from-layer="269" from-port="2" to-layer="271" to-port="0" />
|
| <edge from-layer="270" from-port="0" to-layer="271" to-port="1" />
|
| <edge from-layer="271" from-port="2" to-layer="272" to-port="0" />
|
| <edge from-layer="272" from-port="1" to-layer="274" to-port="0" />
|
| <edge from-layer="273" from-port="0" to-layer="274" to-port="1" />
|
| <edge from-layer="274" from-port="2" to-layer="279" to-port="0" />
|
| <edge from-layer="275" from-port="0" to-layer="279" to-port="1" />
|
| <edge from-layer="276" from-port="0" to-layer="279" to-port="2" />
|
| <edge from-layer="277" from-port="0" to-layer="279" to-port="3" />
|
| <edge from-layer="278" from-port="0" to-layer="279" to-port="4" />
|
| <edge from-layer="279" from-port="5" to-layer="284" to-port="0" />
|
| <edge from-layer="280" from-port="0" to-layer="281" to-port="0" />
|
| <edge from-layer="281" from-port="1" to-layer="283" to-port="0" />
|
| <edge from-layer="282" from-port="0" to-layer="283" to-port="1" />
|
| <edge from-layer="283" from-port="2" to-layer="284" to-port="1" />
|
| <edge from-layer="284" from-port="2" to-layer="286" to-port="0" />
|
| <edge from-layer="285" from-port="0" to-layer="286" to-port="1" />
|
| <edge from-layer="286" from-port="2" to-layer="287" to-port="0" />
|
| <edge from-layer="287" from-port="2" to-layer="289" to-port="0" />
|
| <edge from-layer="288" from-port="0" to-layer="289" to-port="1" />
|
| <edge from-layer="289" from-port="2" to-layer="291" to-port="0" />
|
| <edge from-layer="290" from-port="0" to-layer="291" to-port="1" />
|
| <edge from-layer="291" from-port="2" to-layer="293" to-port="0" />
|
| <edge from-layer="292" from-port="0" to-layer="293" to-port="1" />
|
| <edge from-layer="293" from-port="2" to-layer="363" to-port="1" />
|
| <edge from-layer="293" from-port="2" to-layer="295" to-port="0" />
|
| <edge from-layer="294" from-port="0" to-layer="295" to-port="1" />
|
| <edge from-layer="295" from-port="2" to-layer="300" to-port="0" />
|
| <edge from-layer="296" from-port="0" to-layer="300" to-port="1" />
|
| <edge from-layer="297" from-port="0" to-layer="300" to-port="2" />
|
| <edge from-layer="298" from-port="0" to-layer="300" to-port="3" />
|
| <edge from-layer="299" from-port="0" to-layer="300" to-port="4" />
|
| <edge from-layer="300" from-port="5" to-layer="305" to-port="0" />
|
| <edge from-layer="300" from-port="5" to-layer="337" to-port="0" />
|
| <edge from-layer="300" from-port="5" to-layer="321" to-port="0" />
|
| <edge from-layer="301" from-port="0" to-layer="302" to-port="0" />
|
| <edge from-layer="302" from-port="1" to-layer="304" to-port="0" />
|
| <edge from-layer="303" from-port="0" to-layer="304" to-port="1" />
|
| <edge from-layer="304" from-port="2" to-layer="305" to-port="1" />
|
| <edge from-layer="305" from-port="2" to-layer="307" to-port="0" />
|
| <edge from-layer="306" from-port="0" to-layer="307" to-port="1" />
|
| <edge from-layer="307" from-port="2" to-layer="312" to-port="0" />
|
| <edge from-layer="308" from-port="0" to-layer="312" to-port="1" />
|
| <edge from-layer="309" from-port="0" to-layer="312" to-port="2" />
|
| <edge from-layer="310" from-port="0" to-layer="312" to-port="3" />
|
| <edge from-layer="311" from-port="0" to-layer="312" to-port="4" />
|
| <edge from-layer="312" from-port="5" to-layer="314" to-port="0" />
|
| <edge from-layer="313" from-port="0" to-layer="314" to-port="1" />
|
| <edge from-layer="314" from-port="2" to-layer="316" to-port="0" />
|
| <edge from-layer="315" from-port="0" to-layer="316" to-port="1" />
|
| <edge from-layer="316" from-port="2" to-layer="344" to-port="0" />
|
| <edge from-layer="317" from-port="0" to-layer="318" to-port="0" />
|
| <edge from-layer="318" from-port="1" to-layer="320" to-port="0" />
|
| <edge from-layer="319" from-port="0" to-layer="320" to-port="1" />
|
| <edge from-layer="320" from-port="2" to-layer="321" to-port="1" />
|
| <edge from-layer="321" from-port="2" to-layer="323" to-port="0" />
|
| <edge from-layer="322" from-port="0" to-layer="323" to-port="1" />
|
| <edge from-layer="323" from-port="2" to-layer="328" to-port="0" />
|
| <edge from-layer="324" from-port="0" to-layer="328" to-port="1" />
|
| <edge from-layer="325" from-port="0" to-layer="328" to-port="2" />
|
| <edge from-layer="326" from-port="0" to-layer="328" to-port="3" />
|
| <edge from-layer="327" from-port="0" to-layer="328" to-port="4" />
|
| <edge from-layer="328" from-port="5" to-layer="330" to-port="0" />
|
| <edge from-layer="329" from-port="0" to-layer="330" to-port="1" />
|
| <edge from-layer="330" from-port="2" to-layer="332" to-port="0" />
|
| <edge from-layer="331" from-port="0" to-layer="332" to-port="1" />
|
| <edge from-layer="332" from-port="2" to-layer="344" to-port="1" />
|
| <edge from-layer="333" from-port="0" to-layer="334" to-port="0" />
|
| <edge from-layer="334" from-port="1" to-layer="336" to-port="0" />
|
| <edge from-layer="335" from-port="0" to-layer="336" to-port="1" />
|
| <edge from-layer="336" from-port="2" to-layer="337" to-port="1" />
|
| <edge from-layer="337" from-port="2" to-layer="339" to-port="0" />
|
| <edge from-layer="338" from-port="0" to-layer="339" to-port="1" />
|
| <edge from-layer="339" from-port="2" to-layer="341" to-port="0" />
|
| <edge from-layer="340" from-port="0" to-layer="341" to-port="1" />
|
| <edge from-layer="341" from-port="2" to-layer="343" to-port="0" />
|
| <edge from-layer="342" from-port="0" to-layer="343" to-port="1" />
|
| <edge from-layer="343" from-port="2" to-layer="344" to-port="2" />
|
| <edge from-layer="344" from-port="4" to-layer="346" to-port="0" />
|
| <edge from-layer="345" from-port="0" to-layer="346" to-port="1" />
|
| <edge from-layer="346" from-port="2" to-layer="348" to-port="0" />
|
| <edge from-layer="347" from-port="0" to-layer="348" to-port="1" />
|
| <edge from-layer="348" from-port="2" to-layer="350" to-port="0" />
|
| <edge from-layer="349" from-port="0" to-layer="350" to-port="1" />
|
| <edge from-layer="350" from-port="2" to-layer="355" to-port="0" />
|
| <edge from-layer="351" from-port="0" to-layer="355" to-port="1" />
|
| <edge from-layer="352" from-port="0" to-layer="355" to-port="2" />
|
| <edge from-layer="353" from-port="0" to-layer="355" to-port="3" />
|
| <edge from-layer="354" from-port="0" to-layer="355" to-port="4" />
|
| <edge from-layer="355" from-port="5" to-layer="360" to-port="0" />
|
| <edge from-layer="356" from-port="0" to-layer="357" to-port="0" />
|
| <edge from-layer="357" from-port="1" to-layer="359" to-port="0" />
|
| <edge from-layer="358" from-port="0" to-layer="359" to-port="1" />
|
| <edge from-layer="359" from-port="2" to-layer="360" to-port="1" />
|
| <edge from-layer="360" from-port="2" to-layer="362" to-port="0" />
|
| <edge from-layer="361" from-port="0" to-layer="362" to-port="1" />
|
| <edge from-layer="362" from-port="2" to-layer="363" to-port="0" />
|
| <edge from-layer="363" from-port="2" to-layer="365" to-port="0" />
|
| <edge from-layer="364" from-port="0" to-layer="365" to-port="1" />
|
| <edge from-layer="365" from-port="2" to-layer="367" to-port="0" />
|
| <edge from-layer="366" from-port="0" to-layer="367" to-port="1" />
|
| <edge from-layer="367" from-port="2" to-layer="369" to-port="0" />
|
| <edge from-layer="368" from-port="0" to-layer="369" to-port="1" />
|
| <edge from-layer="369" from-port="2" to-layer="371" to-port="0" />
|
| <edge from-layer="369" from-port="2" to-layer="399" to-port="1" />
|
| <edge from-layer="370" from-port="0" to-layer="371" to-port="1" />
|
| <edge from-layer="371" from-port="2" to-layer="376" to-port="0" />
|
| <edge from-layer="372" from-port="0" to-layer="376" to-port="1" />
|
| <edge from-layer="373" from-port="0" to-layer="376" to-port="2" />
|
| <edge from-layer="374" from-port="0" to-layer="376" to-port="3" />
|
| <edge from-layer="375" from-port="0" to-layer="376" to-port="4" />
|
| <edge from-layer="376" from-port="5" to-layer="381" to-port="0" />
|
| <edge from-layer="377" from-port="0" to-layer="378" to-port="0" />
|
| <edge from-layer="378" from-port="1" to-layer="380" to-port="0" />
|
| <edge from-layer="379" from-port="0" to-layer="380" to-port="1" />
|
| <edge from-layer="380" from-port="2" to-layer="381" to-port="1" />
|
| <edge from-layer="381" from-port="2" to-layer="383" to-port="0" />
|
| <edge from-layer="382" from-port="0" to-layer="383" to-port="1" />
|
| <edge from-layer="383" from-port="2" to-layer="384" to-port="0" />
|
| <edge from-layer="384" from-port="1" to-layer="386" to-port="0" />
|
| <edge from-layer="385" from-port="0" to-layer="386" to-port="1" />
|
| <edge from-layer="386" from-port="2" to-layer="391" to-port="0" />
|
| <edge from-layer="387" from-port="0" to-layer="391" to-port="1" />
|
| <edge from-layer="388" from-port="0" to-layer="391" to-port="2" />
|
| <edge from-layer="389" from-port="0" to-layer="391" to-port="3" />
|
| <edge from-layer="390" from-port="0" to-layer="391" to-port="4" />
|
| <edge from-layer="391" from-port="5" to-layer="396" to-port="0" />
|
| <edge from-layer="392" from-port="0" to-layer="393" to-port="0" />
|
| <edge from-layer="393" from-port="1" to-layer="395" to-port="0" />
|
| <edge from-layer="394" from-port="0" to-layer="395" to-port="1" />
|
| <edge from-layer="395" from-port="2" to-layer="396" to-port="1" />
|
| <edge from-layer="396" from-port="2" to-layer="398" to-port="0" />
|
| <edge from-layer="397" from-port="0" to-layer="398" to-port="1" />
|
| <edge from-layer="398" from-port="2" to-layer="399" to-port="0" />
|
| <edge from-layer="399" from-port="2" to-layer="401" to-port="0" />
|
| <edge from-layer="400" from-port="0" to-layer="401" to-port="1" />
|
| <edge from-layer="401" from-port="2" to-layer="403" to-port="0" />
|
| <edge from-layer="402" from-port="0" to-layer="403" to-port="1" />
|
| <edge from-layer="403" from-port="2" to-layer="405" to-port="0" />
|
| <edge from-layer="404" from-port="0" to-layer="405" to-port="1" />
|
| <edge from-layer="405" from-port="2" to-layer="407" to-port="0" />
|
| <edge from-layer="405" from-port="2" to-layer="475" to-port="1" />
|
| <edge from-layer="406" from-port="0" to-layer="407" to-port="1" />
|
| <edge from-layer="407" from-port="2" to-layer="412" to-port="0" />
|
| <edge from-layer="408" from-port="0" to-layer="412" to-port="1" />
|
| <edge from-layer="409" from-port="0" to-layer="412" to-port="2" />
|
| <edge from-layer="410" from-port="0" to-layer="412" to-port="3" />
|
| <edge from-layer="411" from-port="0" to-layer="412" to-port="4" />
|
| <edge from-layer="412" from-port="5" to-layer="417" to-port="0" />
|
| <edge from-layer="412" from-port="5" to-layer="433" to-port="0" />
|
| <edge from-layer="412" from-port="5" to-layer="449" to-port="0" />
|
| <edge from-layer="413" from-port="0" to-layer="414" to-port="0" />
|
| <edge from-layer="414" from-port="1" to-layer="416" to-port="0" />
|
| <edge from-layer="415" from-port="0" to-layer="416" to-port="1" />
|
| <edge from-layer="416" from-port="2" to-layer="417" to-port="1" />
|
| <edge from-layer="417" from-port="2" to-layer="419" to-port="0" />
|
| <edge from-layer="418" from-port="0" to-layer="419" to-port="1" />
|
| <edge from-layer="419" from-port="2" to-layer="424" to-port="0" />
|
| <edge from-layer="420" from-port="0" to-layer="424" to-port="1" />
|
| <edge from-layer="421" from-port="0" to-layer="424" to-port="2" />
|
| <edge from-layer="422" from-port="0" to-layer="424" to-port="3" />
|
| <edge from-layer="423" from-port="0" to-layer="424" to-port="4" />
|
| <edge from-layer="424" from-port="5" to-layer="426" to-port="0" />
|
| <edge from-layer="425" from-port="0" to-layer="426" to-port="1" />
|
| <edge from-layer="426" from-port="2" to-layer="428" to-port="0" />
|
| <edge from-layer="427" from-port="0" to-layer="428" to-port="1" />
|
| <edge from-layer="428" from-port="2" to-layer="456" to-port="0" />
|
| <edge from-layer="429" from-port="0" to-layer="430" to-port="0" />
|
| <edge from-layer="430" from-port="1" to-layer="432" to-port="0" />
|
| <edge from-layer="431" from-port="0" to-layer="432" to-port="1" />
|
| <edge from-layer="432" from-port="2" to-layer="433" to-port="1" />
|
| <edge from-layer="433" from-port="2" to-layer="435" to-port="0" />
|
| <edge from-layer="434" from-port="0" to-layer="435" to-port="1" />
|
| <edge from-layer="435" from-port="2" to-layer="440" to-port="0" />
|
| <edge from-layer="436" from-port="0" to-layer="440" to-port="1" />
|
| <edge from-layer="437" from-port="0" to-layer="440" to-port="2" />
|
| <edge from-layer="438" from-port="0" to-layer="440" to-port="3" />
|
| <edge from-layer="439" from-port="0" to-layer="440" to-port="4" />
|
| <edge from-layer="440" from-port="5" to-layer="442" to-port="0" />
|
| <edge from-layer="441" from-port="0" to-layer="442" to-port="1" />
|
| <edge from-layer="442" from-port="2" to-layer="444" to-port="0" />
|
| <edge from-layer="443" from-port="0" to-layer="444" to-port="1" />
|
| <edge from-layer="444" from-port="2" to-layer="456" to-port="1" />
|
| <edge from-layer="445" from-port="0" to-layer="446" to-port="0" />
|
| <edge from-layer="446" from-port="1" to-layer="448" to-port="0" />
|
| <edge from-layer="447" from-port="0" to-layer="448" to-port="1" />
|
| <edge from-layer="448" from-port="2" to-layer="449" to-port="1" />
|
| <edge from-layer="449" from-port="2" to-layer="451" to-port="0" />
|
| <edge from-layer="450" from-port="0" to-layer="451" to-port="1" />
|
| <edge from-layer="451" from-port="2" to-layer="453" to-port="0" />
|
| <edge from-layer="452" from-port="0" to-layer="453" to-port="1" />
|
| <edge from-layer="453" from-port="2" to-layer="455" to-port="0" />
|
| <edge from-layer="454" from-port="0" to-layer="455" to-port="1" />
|
| <edge from-layer="455" from-port="2" to-layer="456" to-port="2" />
|
| <edge from-layer="456" from-port="4" to-layer="458" to-port="0" />
|
| <edge from-layer="457" from-port="0" to-layer="458" to-port="1" />
|
| <edge from-layer="458" from-port="2" to-layer="460" to-port="0" />
|
| <edge from-layer="459" from-port="0" to-layer="460" to-port="1" />
|
| <edge from-layer="460" from-port="2" to-layer="462" to-port="0" />
|
| <edge from-layer="461" from-port="0" to-layer="462" to-port="1" />
|
| <edge from-layer="462" from-port="2" to-layer="467" to-port="0" />
|
| <edge from-layer="463" from-port="0" to-layer="467" to-port="1" />
|
| <edge from-layer="464" from-port="0" to-layer="467" to-port="2" />
|
| <edge from-layer="465" from-port="0" to-layer="467" to-port="3" />
|
| <edge from-layer="466" from-port="0" to-layer="467" to-port="4" />
|
| <edge from-layer="467" from-port="5" to-layer="472" to-port="0" />
|
| <edge from-layer="468" from-port="0" to-layer="469" to-port="0" />
|
| <edge from-layer="469" from-port="1" to-layer="471" to-port="0" />
|
| <edge from-layer="470" from-port="0" to-layer="471" to-port="1" />
|
| <edge from-layer="471" from-port="2" to-layer="472" to-port="1" />
|
| <edge from-layer="472" from-port="2" to-layer="474" to-port="0" />
|
| <edge from-layer="473" from-port="0" to-layer="474" to-port="1" />
|
| <edge from-layer="474" from-port="2" to-layer="475" to-port="0" />
|
| <edge from-layer="475" from-port="2" to-layer="477" to-port="0" />
|
| <edge from-layer="476" from-port="0" to-layer="477" to-port="1" />
|
| <edge from-layer="477" from-port="2" to-layer="479" to-port="0" />
|
| <edge from-layer="478" from-port="0" to-layer="479" to-port="1" />
|
| <edge from-layer="479" from-port="2" to-layer="481" to-port="0" />
|
| <edge from-layer="480" from-port="0" to-layer="481" to-port="1" />
|
| <edge from-layer="481" from-port="2" to-layer="483" to-port="0" />
|
| <edge from-layer="481" from-port="2" to-layer="511" to-port="1" />
|
| <edge from-layer="482" from-port="0" to-layer="483" to-port="1" />
|
| <edge from-layer="483" from-port="2" to-layer="488" to-port="0" />
|
| <edge from-layer="484" from-port="0" to-layer="488" to-port="1" />
|
| <edge from-layer="485" from-port="0" to-layer="488" to-port="2" />
|
| <edge from-layer="486" from-port="0" to-layer="488" to-port="3" />
|
| <edge from-layer="487" from-port="0" to-layer="488" to-port="4" />
|
| <edge from-layer="488" from-port="5" to-layer="493" to-port="0" />
|
| <edge from-layer="489" from-port="0" to-layer="490" to-port="0" />
|
| <edge from-layer="490" from-port="1" to-layer="492" to-port="0" />
|
| <edge from-layer="491" from-port="0" to-layer="492" to-port="1" />
|
| <edge from-layer="492" from-port="2" to-layer="493" to-port="1" />
|
| <edge from-layer="493" from-port="2" to-layer="495" to-port="0" />
|
| <edge from-layer="494" from-port="0" to-layer="495" to-port="1" />
|
| <edge from-layer="495" from-port="2" to-layer="496" to-port="0" />
|
| <edge from-layer="496" from-port="1" to-layer="498" to-port="0" />
|
| <edge from-layer="497" from-port="0" to-layer="498" to-port="1" />
|
| <edge from-layer="498" from-port="2" to-layer="503" to-port="0" />
|
| <edge from-layer="499" from-port="0" to-layer="503" to-port="1" />
|
| <edge from-layer="500" from-port="0" to-layer="503" to-port="2" />
|
| <edge from-layer="501" from-port="0" to-layer="503" to-port="3" />
|
| <edge from-layer="502" from-port="0" to-layer="503" to-port="4" />
|
| <edge from-layer="503" from-port="5" to-layer="508" to-port="0" />
|
| <edge from-layer="504" from-port="0" to-layer="505" to-port="0" />
|
| <edge from-layer="505" from-port="1" to-layer="507" to-port="0" />
|
| <edge from-layer="506" from-port="0" to-layer="507" to-port="1" />
|
| <edge from-layer="507" from-port="2" to-layer="508" to-port="1" />
|
| <edge from-layer="508" from-port="2" to-layer="510" to-port="0" />
|
| <edge from-layer="509" from-port="0" to-layer="510" to-port="1" />
|
| <edge from-layer="510" from-port="2" to-layer="511" to-port="0" />
|
| <edge from-layer="511" from-port="2" to-layer="513" to-port="0" />
|
| <edge from-layer="512" from-port="0" to-layer="513" to-port="1" />
|
| <edge from-layer="513" from-port="2" to-layer="515" to-port="0" />
|
| <edge from-layer="514" from-port="0" to-layer="515" to-port="1" />
|
| <edge from-layer="515" from-port="2" to-layer="517" to-port="0" />
|
| <edge from-layer="516" from-port="0" to-layer="517" to-port="1" />
|
| <edge from-layer="517" from-port="2" to-layer="587" to-port="1" />
|
| <edge from-layer="517" from-port="2" to-layer="519" to-port="0" />
|
| <edge from-layer="518" from-port="0" to-layer="519" to-port="1" />
|
| <edge from-layer="519" from-port="2" to-layer="524" to-port="0" />
|
| <edge from-layer="520" from-port="0" to-layer="524" to-port="1" />
|
| <edge from-layer="521" from-port="0" to-layer="524" to-port="2" />
|
| <edge from-layer="522" from-port="0" to-layer="524" to-port="3" />
|
| <edge from-layer="523" from-port="0" to-layer="524" to-port="4" />
|
| <edge from-layer="524" from-port="5" to-layer="529" to-port="0" />
|
| <edge from-layer="524" from-port="5" to-layer="545" to-port="0" />
|
| <edge from-layer="524" from-port="5" to-layer="561" to-port="0" />
|
| <edge from-layer="525" from-port="0" to-layer="526" to-port="0" />
|
| <edge from-layer="526" from-port="1" to-layer="528" to-port="0" />
|
| <edge from-layer="527" from-port="0" to-layer="528" to-port="1" />
|
| <edge from-layer="528" from-port="2" to-layer="529" to-port="1" />
|
| <edge from-layer="529" from-port="2" to-layer="531" to-port="0" />
|
| <edge from-layer="530" from-port="0" to-layer="531" to-port="1" />
|
| <edge from-layer="531" from-port="2" to-layer="536" to-port="0" />
|
| <edge from-layer="532" from-port="0" to-layer="536" to-port="1" />
|
| <edge from-layer="533" from-port="0" to-layer="536" to-port="2" />
|
| <edge from-layer="534" from-port="0" to-layer="536" to-port="3" />
|
| <edge from-layer="535" from-port="0" to-layer="536" to-port="4" />
|
| <edge from-layer="536" from-port="5" to-layer="538" to-port="0" />
|
| <edge from-layer="537" from-port="0" to-layer="538" to-port="1" />
|
| <edge from-layer="538" from-port="2" to-layer="540" to-port="0" />
|
| <edge from-layer="539" from-port="0" to-layer="540" to-port="1" />
|
| <edge from-layer="540" from-port="2" to-layer="568" to-port="0" />
|
| <edge from-layer="541" from-port="0" to-layer="542" to-port="0" />
|
| <edge from-layer="542" from-port="1" to-layer="544" to-port="0" />
|
| <edge from-layer="543" from-port="0" to-layer="544" to-port="1" />
|
| <edge from-layer="544" from-port="2" to-layer="545" to-port="1" />
|
| <edge from-layer="545" from-port="2" to-layer="547" to-port="0" />
|
| <edge from-layer="546" from-port="0" to-layer="547" to-port="1" />
|
| <edge from-layer="547" from-port="2" to-layer="552" to-port="0" />
|
| <edge from-layer="548" from-port="0" to-layer="552" to-port="1" />
|
| <edge from-layer="549" from-port="0" to-layer="552" to-port="2" />
|
| <edge from-layer="550" from-port="0" to-layer="552" to-port="3" />
|
| <edge from-layer="551" from-port="0" to-layer="552" to-port="4" />
|
| <edge from-layer="552" from-port="5" to-layer="554" to-port="0" />
|
| <edge from-layer="553" from-port="0" to-layer="554" to-port="1" />
|
| <edge from-layer="554" from-port="2" to-layer="556" to-port="0" />
|
| <edge from-layer="555" from-port="0" to-layer="556" to-port="1" />
|
| <edge from-layer="556" from-port="2" to-layer="568" to-port="1" />
|
| <edge from-layer="557" from-port="0" to-layer="558" to-port="0" />
|
| <edge from-layer="558" from-port="1" to-layer="560" to-port="0" />
|
| <edge from-layer="559" from-port="0" to-layer="560" to-port="1" />
|
| <edge from-layer="560" from-port="2" to-layer="561" to-port="1" />
|
| <edge from-layer="561" from-port="2" to-layer="563" to-port="0" />
|
| <edge from-layer="562" from-port="0" to-layer="563" to-port="1" />
|
| <edge from-layer="563" from-port="2" to-layer="565" to-port="0" />
|
| <edge from-layer="564" from-port="0" to-layer="565" to-port="1" />
|
| <edge from-layer="565" from-port="2" to-layer="567" to-port="0" />
|
| <edge from-layer="566" from-port="0" to-layer="567" to-port="1" />
|
| <edge from-layer="567" from-port="2" to-layer="568" to-port="2" />
|
| <edge from-layer="568" from-port="4" to-layer="570" to-port="0" />
|
| <edge from-layer="569" from-port="0" to-layer="570" to-port="1" />
|
| <edge from-layer="570" from-port="2" to-layer="572" to-port="0" />
|
| <edge from-layer="571" from-port="0" to-layer="572" to-port="1" />
|
| <edge from-layer="572" from-port="2" to-layer="574" to-port="0" />
|
| <edge from-layer="573" from-port="0" to-layer="574" to-port="1" />
|
| <edge from-layer="574" from-port="2" to-layer="579" to-port="0" />
|
| <edge from-layer="575" from-port="0" to-layer="579" to-port="1" />
|
| <edge from-layer="576" from-port="0" to-layer="579" to-port="2" />
|
| <edge from-layer="577" from-port="0" to-layer="579" to-port="3" />
|
| <edge from-layer="578" from-port="0" to-layer="579" to-port="4" />
|
| <edge from-layer="579" from-port="5" to-layer="584" to-port="0" />
|
| <edge from-layer="580" from-port="0" to-layer="581" to-port="0" />
|
| <edge from-layer="581" from-port="1" to-layer="583" to-port="0" />
|
| <edge from-layer="582" from-port="0" to-layer="583" to-port="1" />
|
| <edge from-layer="583" from-port="2" to-layer="584" to-port="1" />
|
| <edge from-layer="584" from-port="2" to-layer="586" to-port="0" />
|
| <edge from-layer="585" from-port="0" to-layer="586" to-port="1" />
|
| <edge from-layer="586" from-port="2" to-layer="587" to-port="0" />
|
| <edge from-layer="587" from-port="2" to-layer="589" to-port="0" />
|
| <edge from-layer="588" from-port="0" to-layer="589" to-port="1" />
|
| <edge from-layer="589" from-port="2" to-layer="591" to-port="0" />
|
| <edge from-layer="590" from-port="0" to-layer="591" to-port="1" />
|
| <edge from-layer="591" from-port="2" to-layer="593" to-port="0" />
|
| <edge from-layer="592" from-port="0" to-layer="593" to-port="1" />
|
| <edge from-layer="593" from-port="2" to-layer="595" to-port="0" />
|
| <edge from-layer="593" from-port="2" to-layer="623" to-port="1" />
|
| <edge from-layer="594" from-port="0" to-layer="595" to-port="1" />
|
| <edge from-layer="595" from-port="2" to-layer="600" to-port="0" />
|
| <edge from-layer="596" from-port="0" to-layer="600" to-port="1" />
|
| <edge from-layer="597" from-port="0" to-layer="600" to-port="2" />
|
| <edge from-layer="598" from-port="0" to-layer="600" to-port="3" />
|
| <edge from-layer="599" from-port="0" to-layer="600" to-port="4" />
|
| <edge from-layer="600" from-port="5" to-layer="605" to-port="0" />
|
| <edge from-layer="601" from-port="0" to-layer="602" to-port="0" />
|
| <edge from-layer="602" from-port="1" to-layer="604" to-port="0" />
|
| <edge from-layer="603" from-port="0" to-layer="604" to-port="1" />
|
| <edge from-layer="604" from-port="2" to-layer="605" to-port="1" />
|
| <edge from-layer="605" from-port="2" to-layer="607" to-port="0" />
|
| <edge from-layer="606" from-port="0" to-layer="607" to-port="1" />
|
| <edge from-layer="607" from-port="2" to-layer="608" to-port="0" />
|
| <edge from-layer="608" from-port="1" to-layer="610" to-port="0" />
|
| <edge from-layer="609" from-port="0" to-layer="610" to-port="1" />
|
| <edge from-layer="610" from-port="2" to-layer="615" to-port="0" />
|
| <edge from-layer="611" from-port="0" to-layer="615" to-port="1" />
|
| <edge from-layer="612" from-port="0" to-layer="615" to-port="2" />
|
| <edge from-layer="613" from-port="0" to-layer="615" to-port="3" />
|
| <edge from-layer="614" from-port="0" to-layer="615" to-port="4" />
|
| <edge from-layer="615" from-port="5" to-layer="620" to-port="0" />
|
| <edge from-layer="616" from-port="0" to-layer="617" to-port="0" />
|
| <edge from-layer="617" from-port="1" to-layer="619" to-port="0" />
|
| <edge from-layer="618" from-port="0" to-layer="619" to-port="1" />
|
| <edge from-layer="619" from-port="2" to-layer="620" to-port="1" />
|
| <edge from-layer="620" from-port="2" to-layer="622" to-port="0" />
|
| <edge from-layer="621" from-port="0" to-layer="622" to-port="1" />
|
| <edge from-layer="622" from-port="2" to-layer="623" to-port="0" />
|
| <edge from-layer="623" from-port="2" to-layer="625" to-port="0" />
|
| <edge from-layer="624" from-port="0" to-layer="625" to-port="1" />
|
| <edge from-layer="625" from-port="2" to-layer="627" to-port="0" />
|
| <edge from-layer="626" from-port="0" to-layer="627" to-port="1" />
|
| <edge from-layer="627" from-port="2" to-layer="629" to-port="0" />
|
| <edge from-layer="628" from-port="0" to-layer="629" to-port="1" />
|
| <edge from-layer="629" from-port="2" to-layer="631" to-port="0" />
|
| <edge from-layer="629" from-port="2" to-layer="699" to-port="1" />
|
| <edge from-layer="630" from-port="0" to-layer="631" to-port="1" />
|
| <edge from-layer="631" from-port="2" to-layer="636" to-port="0" />
|
| <edge from-layer="632" from-port="0" to-layer="636" to-port="1" />
|
| <edge from-layer="633" from-port="0" to-layer="636" to-port="2" />
|
| <edge from-layer="634" from-port="0" to-layer="636" to-port="3" />
|
| <edge from-layer="635" from-port="0" to-layer="636" to-port="4" />
|
| <edge from-layer="636" from-port="5" to-layer="641" to-port="0" />
|
| <edge from-layer="636" from-port="5" to-layer="657" to-port="0" />
|
| <edge from-layer="636" from-port="5" to-layer="673" to-port="0" />
|
| <edge from-layer="637" from-port="0" to-layer="638" to-port="0" />
|
| <edge from-layer="638" from-port="1" to-layer="640" to-port="0" />
|
| <edge from-layer="639" from-port="0" to-layer="640" to-port="1" />
|
| <edge from-layer="640" from-port="2" to-layer="641" to-port="1" />
|
| <edge from-layer="641" from-port="2" to-layer="643" to-port="0" />
|
| <edge from-layer="642" from-port="0" to-layer="643" to-port="1" />
|
| <edge from-layer="643" from-port="2" to-layer="648" to-port="0" />
|
| <edge from-layer="644" from-port="0" to-layer="648" to-port="1" />
|
| <edge from-layer="645" from-port="0" to-layer="648" to-port="2" />
|
| <edge from-layer="646" from-port="0" to-layer="648" to-port="3" />
|
| <edge from-layer="647" from-port="0" to-layer="648" to-port="4" />
|
| <edge from-layer="648" from-port="5" to-layer="650" to-port="0" />
|
| <edge from-layer="649" from-port="0" to-layer="650" to-port="1" />
|
| <edge from-layer="650" from-port="2" to-layer="652" to-port="0" />
|
| <edge from-layer="651" from-port="0" to-layer="652" to-port="1" />
|
| <edge from-layer="652" from-port="2" to-layer="680" to-port="0" />
|
| <edge from-layer="653" from-port="0" to-layer="654" to-port="0" />
|
| <edge from-layer="654" from-port="1" to-layer="656" to-port="0" />
|
| <edge from-layer="655" from-port="0" to-layer="656" to-port="1" />
|
| <edge from-layer="656" from-port="2" to-layer="657" to-port="1" />
|
| <edge from-layer="657" from-port="2" to-layer="659" to-port="0" />
|
| <edge from-layer="658" from-port="0" to-layer="659" to-port="1" />
|
| <edge from-layer="659" from-port="2" to-layer="664" to-port="0" />
|
| <edge from-layer="660" from-port="0" to-layer="664" to-port="1" />
|
| <edge from-layer="661" from-port="0" to-layer="664" to-port="2" />
|
| <edge from-layer="662" from-port="0" to-layer="664" to-port="3" />
|
| <edge from-layer="663" from-port="0" to-layer="664" to-port="4" />
|
| <edge from-layer="664" from-port="5" to-layer="666" to-port="0" />
|
| <edge from-layer="665" from-port="0" to-layer="666" to-port="1" />
|
| <edge from-layer="666" from-port="2" to-layer="668" to-port="0" />
|
| <edge from-layer="667" from-port="0" to-layer="668" to-port="1" />
|
| <edge from-layer="668" from-port="2" to-layer="680" to-port="1" />
|
| <edge from-layer="669" from-port="0" to-layer="670" to-port="0" />
|
| <edge from-layer="670" from-port="1" to-layer="672" to-port="0" />
|
| <edge from-layer="671" from-port="0" to-layer="672" to-port="1" />
|
| <edge from-layer="672" from-port="2" to-layer="673" to-port="1" />
|
| <edge from-layer="673" from-port="2" to-layer="675" to-port="0" />
|
| <edge from-layer="674" from-port="0" to-layer="675" to-port="1" />
|
| <edge from-layer="675" from-port="2" to-layer="677" to-port="0" />
|
| <edge from-layer="676" from-port="0" to-layer="677" to-port="1" />
|
| <edge from-layer="677" from-port="2" to-layer="679" to-port="0" />
|
| <edge from-layer="678" from-port="0" to-layer="679" to-port="1" />
|
| <edge from-layer="679" from-port="2" to-layer="680" to-port="2" />
|
| <edge from-layer="680" from-port="4" to-layer="682" to-port="0" />
|
| <edge from-layer="681" from-port="0" to-layer="682" to-port="1" />
|
| <edge from-layer="682" from-port="2" to-layer="684" to-port="0" />
|
| <edge from-layer="683" from-port="0" to-layer="684" to-port="1" />
|
| <edge from-layer="684" from-port="2" to-layer="686" to-port="0" />
|
| <edge from-layer="685" from-port="0" to-layer="686" to-port="1" />
|
| <edge from-layer="686" from-port="2" to-layer="691" to-port="0" />
|
| <edge from-layer="687" from-port="0" to-layer="691" to-port="1" />
|
| <edge from-layer="688" from-port="0" to-layer="691" to-port="2" />
|
| <edge from-layer="689" from-port="0" to-layer="691" to-port="3" />
|
| <edge from-layer="690" from-port="0" to-layer="691" to-port="4" />
|
| <edge from-layer="691" from-port="5" to-layer="696" to-port="0" />
|
| <edge from-layer="692" from-port="0" to-layer="693" to-port="0" />
|
| <edge from-layer="693" from-port="1" to-layer="695" to-port="0" />
|
| <edge from-layer="694" from-port="0" to-layer="695" to-port="1" />
|
| <edge from-layer="695" from-port="2" to-layer="696" to-port="1" />
|
| <edge from-layer="696" from-port="2" to-layer="698" to-port="0" />
|
| <edge from-layer="697" from-port="0" to-layer="698" to-port="1" />
|
| <edge from-layer="698" from-port="2" to-layer="699" to-port="0" />
|
| <edge from-layer="699" from-port="2" to-layer="701" to-port="0" />
|
| <edge from-layer="700" from-port="0" to-layer="701" to-port="1" />
|
| <edge from-layer="701" from-port="2" to-layer="703" to-port="0" />
|
| <edge from-layer="702" from-port="0" to-layer="703" to-port="1" />
|
| <edge from-layer="703" from-port="2" to-layer="705" to-port="0" />
|
| <edge from-layer="704" from-port="0" to-layer="705" to-port="1" />
|
| <edge from-layer="705" from-port="2" to-layer="707" to-port="0" />
|
| <edge from-layer="705" from-port="2" to-layer="735" to-port="1" />
|
| <edge from-layer="706" from-port="0" to-layer="707" to-port="1" />
|
| <edge from-layer="707" from-port="2" to-layer="712" to-port="0" />
|
| <edge from-layer="708" from-port="0" to-layer="712" to-port="1" />
|
| <edge from-layer="709" from-port="0" to-layer="712" to-port="2" />
|
| <edge from-layer="710" from-port="0" to-layer="712" to-port="3" />
|
| <edge from-layer="711" from-port="0" to-layer="712" to-port="4" />
|
| <edge from-layer="712" from-port="5" to-layer="717" to-port="0" />
|
| <edge from-layer="713" from-port="0" to-layer="714" to-port="0" />
|
| <edge from-layer="714" from-port="1" to-layer="716" to-port="0" />
|
| <edge from-layer="715" from-port="0" to-layer="716" to-port="1" />
|
| <edge from-layer="716" from-port="2" to-layer="717" to-port="1" />
|
| <edge from-layer="717" from-port="2" to-layer="719" to-port="0" />
|
| <edge from-layer="718" from-port="0" to-layer="719" to-port="1" />
|
| <edge from-layer="719" from-port="2" to-layer="720" to-port="0" />
|
| <edge from-layer="720" from-port="1" to-layer="722" to-port="0" />
|
| <edge from-layer="721" from-port="0" to-layer="722" to-port="1" />
|
| <edge from-layer="722" from-port="2" to-layer="727" to-port="0" />
|
| <edge from-layer="723" from-port="0" to-layer="727" to-port="1" />
|
| <edge from-layer="724" from-port="0" to-layer="727" to-port="2" />
|
| <edge from-layer="725" from-port="0" to-layer="727" to-port="3" />
|
| <edge from-layer="726" from-port="0" to-layer="727" to-port="4" />
|
| <edge from-layer="727" from-port="5" to-layer="732" to-port="0" />
|
| <edge from-layer="728" from-port="0" to-layer="729" to-port="0" />
|
| <edge from-layer="729" from-port="1" to-layer="731" to-port="0" />
|
| <edge from-layer="730" from-port="0" to-layer="731" to-port="1" />
|
| <edge from-layer="731" from-port="2" to-layer="732" to-port="1" />
|
| <edge from-layer="732" from-port="2" to-layer="734" to-port="0" />
|
| <edge from-layer="733" from-port="0" to-layer="734" to-port="1" />
|
| <edge from-layer="734" from-port="2" to-layer="735" to-port="0" />
|
| <edge from-layer="735" from-port="2" to-layer="737" to-port="0" />
|
| <edge from-layer="736" from-port="0" to-layer="737" to-port="1" />
|
| <edge from-layer="737" from-port="2" to-layer="739" to-port="0" />
|
| <edge from-layer="738" from-port="0" to-layer="739" to-port="1" />
|
| <edge from-layer="739" from-port="2" to-layer="741" to-port="0" />
|
| <edge from-layer="740" from-port="0" to-layer="741" to-port="1" />
|
| <edge from-layer="741" from-port="2" to-layer="744" to-port="0" />
|
| <edge from-layer="742" from-port="0" to-layer="744" to-port="1" />
|
| <edge from-layer="743" from-port="0" to-layer="744" to-port="2" />
|
| <edge from-layer="744" from-port="3" to-layer="746" to-port="0" />
|
| <edge from-layer="745" from-port="0" to-layer="746" to-port="1" />
|
| <edge from-layer="746" from-port="2" to-layer="751" to-port="0" />
|
| <edge from-layer="747" from-port="0" to-layer="751" to-port="1" />
|
| <edge from-layer="748" from-port="0" to-layer="751" to-port="2" />
|
| <edge from-layer="749" from-port="0" to-layer="751" to-port="3" />
|
| <edge from-layer="750" from-port="0" to-layer="751" to-port="4" />
|
| <edge from-layer="751" from-port="5" to-layer="756" to-port="0" />
|
| <edge from-layer="752" from-port="0" to-layer="753" to-port="0" />
|
| <edge from-layer="753" from-port="1" to-layer="755" to-port="0" />
|
| <edge from-layer="754" from-port="0" to-layer="755" to-port="1" />
|
| <edge from-layer="755" from-port="2" to-layer="756" to-port="1" />
|
| <edge from-layer="756" from-port="2" to-layer="758" to-port="0" />
|
| <edge from-layer="757" from-port="0" to-layer="758" to-port="1" />
|
| <edge from-layer="758" from-port="2" to-layer="759" to-port="0" />
|
| <edge from-layer="759" from-port="1" to-layer="761" to-port="0" />
|
| <edge from-layer="760" from-port="0" to-layer="761" to-port="1" />
|
| <edge from-layer="761" from-port="2" to-layer="766" to-port="0" />
|
| <edge from-layer="762" from-port="0" to-layer="766" to-port="1" />
|
| <edge from-layer="763" from-port="0" to-layer="766" to-port="2" />
|
| <edge from-layer="764" from-port="0" to-layer="766" to-port="3" />
|
| <edge from-layer="765" from-port="0" to-layer="766" to-port="4" />
|
| <edge from-layer="766" from-port="5" to-layer="771" to-port="0" />
|
| <edge from-layer="767" from-port="0" to-layer="768" to-port="0" />
|
| <edge from-layer="768" from-port="1" to-layer="770" to-port="0" />
|
| <edge from-layer="769" from-port="0" to-layer="770" to-port="1" />
|
| <edge from-layer="770" from-port="2" to-layer="771" to-port="1" />
|
| <edge from-layer="771" from-port="2" to-layer="773" to-port="0" />
|
| <edge from-layer="772" from-port="0" to-layer="773" to-port="1" />
|
| <edge from-layer="773" from-port="2" to-layer="774" to-port="0" />
|
| </edges>
|
| <rt_info>
|
| <Runtime_version value="2024.4.1-16618-643f23d1318-releases/2024/4" />
|
| <conversion_parameters>
|
| <framework value="pytorch" />
|
| <is_python_object value="True" />
|
| </conversion_parameters>
|
| <nncf>
|
| <friendly_names_were_updated value="True" />
|
| <quantization>
|
| <advanced_parameters value="{'overflow_fix': 'disable', 'quantize_outputs': False, 'inplace_statistics': True, 'disable_channel_alignment': True, 'disable_bias_correction': False, 'batchwise_statistics': None, 'activations_quantization_params': None, 'weights_quantization_params': None, 'activations_range_estimator_params': {'min': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}, 'max': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}}, 'weights_range_estimator_params': {'min': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}, 'max': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}}, 'bias_correction_params': {'apply_for_all_nodes': False, 'threshold': None}, 'smooth_quant_alphas': {'convolution': -1, 'matmul': 0.95}, 'smooth_quant_alpha': None, 'backend_params': {}}" />
|
| <fast_bias_correction value="True" />
|
| <ignored_scope>
|
| <types value="['GroupNormalization']" />
|
| </ignored_scope>
|
| <model_type value="transformer" />
|
| <preset value="mixed" />
|
| <subset_size value="300" />
|
| <target_device value="ANY" />
|
| </quantization>
|
| </nncf>
|
| <optimum>
|
| <optimum_intel_version value="1.20.1" />
|
| <optimum_version value="1.24.0" />
|
| <pytorch_version value="2.6.0+cu124" />
|
| <transformers_version value="4.52.0.dev0" />
|
| </optimum>
|
| </rt_info>
|
| </net>
|
|
|