| <?xml version="1.0"?>
|
| <net name="Model0" version="11">
|
| <layers>
|
| <layer id="0" name="pixel_values" type="Parameter" version="opset1">
|
| <data shape="?,?,?,?" element_type="f32" />
|
| <output>
|
| <port id="0" precision="FP32" names="39,input.1,pixel_values">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="1" name="self.embeddings.class_embedding_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="0" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.embeddings.class_embedding">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="2" name="self.embeddings.class_embedding" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="3" name="self.embeddings.patch_embedding.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3, 16, 16" offset="1536" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.embeddings.patch_embedding.weight">
|
| <dim>768</dim>
|
| <dim>3</dim>
|
| <dim>16</dim>
|
| <dim>16</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="4" name="self.embeddings.patch_embedding.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3</dim>
|
| <dim>16</dim>
|
| <dim>16</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3</dim>
|
| <dim>16</dim>
|
| <dim>16</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="5" name="__module.embeddings.patch_embedding/aten::_convolution/Convolution" type="Convolution" version="opset1">
|
| <data strides="16, 16" dilations="1, 1" pads_begin="0, 0" pads_end="0, 0" auto_pad="explicit" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3</dim>
|
| <dim>16</dim>
|
| <dim>16</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="6" name="__module.embeddings.patch_embedding/aten::_convolution/Reshape_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 768, 1, 1" offset="1181184" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="7" name="__module.embeddings.patch_embedding/aten::_convolution/Reshape" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="8" name="__module.embeddings.patch_embedding/aten::_convolution/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="46,patch_embeds.1">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="9" name="ShapeOf_10114" type="ShapeOf" version="opset3">
|
| <data output_type="i64" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="10" name="Constant_10115" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="1182720" size="8" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="11" name="Constant_10116" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="1182720" size="8" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64" />
|
| </output>
|
| </layer>
|
| <layer id="12" name="Gather_10117" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="I64" names="38">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="13" name="Constant_8687" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="1182728" size="8" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="14" name="Constant_8689" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="1182728" size="8" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="15" name="__module.embeddings/prim::ListConstruct" type="Concat" version="opset1">
|
| <data axis="0" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="2" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="3" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="16" name="__module.embeddings/aten::expand/Broadcast" type="Broadcast" version="opset3">
|
| <data mode="bidirectional" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="50,51,class_embeds">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="17" name="Constant_10202" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="1182736" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="18" name="__module.embeddings/aten::flatten/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="47">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| <dim>-1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="19" name="__module.embeddings/aten::transpose/Constant" type="Const" version="opset1">
|
| <data element_type="i32" shape="3" offset="1182760" size="12" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="20" name="__module.embeddings/aten::transpose/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| <dim>-1</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="48,patch_embeds">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="21" name="__module.embeddings/aten::cat/Concat" type="Concat" version="opset1">
|
| <data axis="1" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="53,embeddings.1">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="22" name="__module.embeddings/aten::slice/Slice_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 577, 768" offset="1182772" size="886272" />
|
| <output>
|
| <port id="0" precision="FP16" names="55">
|
| <dim>1</dim>
|
| <dim>577</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="23" name="__module.embeddings/aten::slice/Slice" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>577</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>577</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="24" name="Constant_192" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="1182720" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="25" name="ShapeOf_10126" type="ShapeOf" version="opset3">
|
| <data output_type="i64" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="26" name="Constant_10127" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="1182728" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="27" name="Constant_10128" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="1182720" size="8" />
|
| <output>
|
| <port id="0" precision="I64" />
|
| </output>
|
| </layer>
|
| <layer id="28" name="Gather_10129" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="I64" names="54">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="29" name="Constant_195" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="1182728" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="30" name="Constant_190" type="Const" version="opset1">
|
| <data element_type="i64" shape="1" offset="1182728" size="8" />
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="31" name="__module.embeddings/aten::slice/Slice_1" type="Slice" version="opset8">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>1</dim>
|
| <dim>577</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="2" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="3" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| <port id="4" precision="I64">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="56,57,58">
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="32" name="__module.embeddings/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="59,input.3">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="33" name="__module.encoder.layers.0.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="34" name="__module.encoder.layers.0.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="35" name="Constant_9918_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="2069048" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="36" name="Constant_9918" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="37" name="__module.encoder.layers.0.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="38" name="Constant_9919_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="2070584" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="39" name="Constant_9919" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="40" name="__module.encoder.layers.0.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="108,hidden_states.1">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="41" name="self.encoder.layers.0.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="2072120" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.0.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="42" name="self.encoder.layers.0.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="43" name="__module.encoder.layers.0.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="44" name="Constant_9920_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="5611064" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="45" name="Constant_9920" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="46" name="__module.encoder.layers.0.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="117">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="47" name="Constant_10203" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="48" name="__module.encoder.layers.0.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="121">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="49" name="Constant_364" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="122">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="50" name="__module.encoder.layers.0.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="123,mixed_qkv.1">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="51" name="75" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="1182720" size="8" />
|
| <output>
|
| <port id="0" precision="I64" names="75" />
|
| </output>
|
| </layer>
|
| <layer id="52" name="__module.encoder.layers.0.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="124,query_states.1">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="53" name="74" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="1182728" size="8" />
|
| <output>
|
| <port id="0" precision="I64" names="74" />
|
| </output>
|
| </layer>
|
| <layer id="54" name="__module.encoder.layers.0.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="125,key_states.1">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="55" name="73" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="5615752" size="8" />
|
| <output>
|
| <port id="0" precision="I64" names="73" />
|
| </output>
|
| </layer>
|
| <layer id="56" name="__module.encoder.layers.0.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="126,value_states.1">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="57" name="Constant_9496_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="58" name="Constant_9496" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="59" name="Constant_220_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615762" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" names="66" />
|
| </output>
|
| </layer>
|
| <layer id="60" name="Constant_220" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="61" name="__module.encoder.layers.0.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="132">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="62" name="Constant_459" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="133">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="63" name="__module.encoder.layers.0.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="134,context_layer.1">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="64" name="__module.encoder.layers.0.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="65" name="__module.encoder.layers.0.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="138,input.9">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="66" name="self.encoder.layers.0.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="5615820" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.0.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="67" name="self.encoder.layers.0.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="68" name="__module.encoder.layers.0.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="69" name="Constant_9921_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="6795468" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="70" name="Constant_9921" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="71" name="__module.encoder.layers.0.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="141,hidden_states.3">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="72" name="__module.encoder.layers.0/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="142,input.11">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="73" name="__module.encoder.layers.0.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="74" name="__module.encoder.layers.0.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="75" name="Constant_9922_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="6797004" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="76" name="Constant_9922" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="77" name="__module.encoder.layers.0.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="78" name="Constant_9923_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="6798540" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="79" name="Constant_9923" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="80" name="__module.encoder.layers.0.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="146,input.13">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="81" name="self.encoder.layers.0.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="6800076" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.0.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="82" name="self.encoder.layers.0.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="83" name="__module.encoder.layers.0.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="84" name="Constant_9924_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="11518668" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="85" name="Constant_9924" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="86" name="__module.encoder.layers.0.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="152,input.15">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="87" name="__module.encoder.layers.0.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="153,input.17">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="88" name="self.encoder.layers.0.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="11524812" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.0.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="89" name="self.encoder.layers.0.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="90" name="__module.encoder.layers.0.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="91" name="Constant_9925_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="16243404" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="92" name="Constant_9925" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="93" name="__module.encoder.layers.0.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="156,hidden_states.5">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="94" name="__module.encoder.layers.0/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="157,input.19">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="95" name="__module.encoder.layers.1.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="96" name="__module.encoder.layers.1.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="97" name="Constant_9926_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="16244940" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="98" name="Constant_9926" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="99" name="__module.encoder.layers.1.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="100" name="Constant_9927_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="16246476" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="101" name="Constant_9927" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="102" name="__module.encoder.layers.1.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="165,hidden_states.7">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="103" name="self.encoder.layers.1.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="16248012" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.1.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="104" name="self.encoder.layers.1.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="105" name="__module.encoder.layers.1.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="106" name="Constant_9928_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="19786956" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="107" name="Constant_9928" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="108" name="__module.encoder.layers.1.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="174">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="109" name="Constant_10204" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="110" name="__module.encoder.layers.1.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="178">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="111" name="Constant_642" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="179">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="112" name="__module.encoder.layers.1.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="180,mixed_qkv.3">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="113" name="__module.encoder.layers.1.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="181,query_states.3">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="114" name="__module.encoder.layers.1.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="182,key_states.3">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="115" name="__module.encoder.layers.1.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="183,value_states.3">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="116" name="Constant_9512_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="117" name="Constant_9512" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="118" name="__module.encoder.layers.1.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="189">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="119" name="Constant_737" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="190">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="120" name="__module.encoder.layers.1.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="191,context_layer.3">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="121" name="__module.encoder.layers.1.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="122" name="__module.encoder.layers.1.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="195,input.25">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="123" name="self.encoder.layers.1.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="19791564" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.1.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="124" name="self.encoder.layers.1.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="125" name="__module.encoder.layers.1.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="126" name="Constant_9929_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="20971212" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="127" name="Constant_9929" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="128" name="__module.encoder.layers.1.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="198,hidden_states.9">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="129" name="__module.encoder.layers.1/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="199,input.27">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="130" name="__module.encoder.layers.1.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="131" name="__module.encoder.layers.1.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="132" name="Constant_9930_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="20972748" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="133" name="Constant_9930" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="134" name="__module.encoder.layers.1.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="135" name="Constant_9931_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="20974284" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="136" name="Constant_9931" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="137" name="__module.encoder.layers.1.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="203,input.29">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="138" name="self.encoder.layers.1.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="20975820" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.1.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="139" name="self.encoder.layers.1.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="140" name="__module.encoder.layers.1.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="141" name="Constant_9932_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="25694412" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="142" name="Constant_9932" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="143" name="__module.encoder.layers.1.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="209,input.31">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="144" name="__module.encoder.layers.1.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="210,input.33">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="145" name="self.encoder.layers.1.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="25700556" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.1.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="146" name="self.encoder.layers.1.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="147" name="__module.encoder.layers.1.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="148" name="Constant_9933_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="30419148" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="149" name="Constant_9933" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="150" name="__module.encoder.layers.1.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="213,hidden_states.11">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="151" name="__module.encoder.layers.1/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="214,input.35">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="152" name="__module.encoder.layers.2.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="153" name="__module.encoder.layers.2.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="154" name="Constant_9934_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="30420684" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="155" name="Constant_9934" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="156" name="__module.encoder.layers.2.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="157" name="Constant_9935_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="30422220" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="158" name="Constant_9935" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="159" name="__module.encoder.layers.2.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="222,hidden_states.13">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="160" name="self.encoder.layers.2.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="30423756" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.2.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="161" name="self.encoder.layers.2.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="162" name="__module.encoder.layers.2.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="163" name="Constant_9936_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="33962700" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="164" name="Constant_9936" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="165" name="__module.encoder.layers.2.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="231">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="166" name="Constant_10205" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="167" name="__module.encoder.layers.2.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="235">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="168" name="Constant_920" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="236">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="169" name="__module.encoder.layers.2.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="237,mixed_qkv.5">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="170" name="__module.encoder.layers.2.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="238,query_states.5">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="171" name="__module.encoder.layers.2.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="239,key_states.5">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="172" name="__module.encoder.layers.2.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="240,value_states.5">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="173" name="Constant_9528_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="174" name="Constant_9528" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="175" name="__module.encoder.layers.2.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="246">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="176" name="Constant_1015" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="247">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="177" name="__module.encoder.layers.2.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="248,context_layer.5">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="178" name="__module.encoder.layers.2.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="179" name="__module.encoder.layers.2.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="252,input.41">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="180" name="self.encoder.layers.2.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="33967308" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.2.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="181" name="self.encoder.layers.2.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="182" name="__module.encoder.layers.2.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="183" name="Constant_9937_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="35146956" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="184" name="Constant_9937" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="185" name="__module.encoder.layers.2.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="255,hidden_states.15">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="186" name="__module.encoder.layers.2/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="256,input.43">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="187" name="__module.encoder.layers.2.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="188" name="__module.encoder.layers.2.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="189" name="Constant_9938_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="35148492" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="190" name="Constant_9938" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="191" name="__module.encoder.layers.2.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="192" name="Constant_9939_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="35150028" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="193" name="Constant_9939" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="194" name="__module.encoder.layers.2.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="260,input.45">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="195" name="self.encoder.layers.2.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="35151564" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.2.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="196" name="self.encoder.layers.2.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="197" name="__module.encoder.layers.2.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="198" name="Constant_9940_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="39870156" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="199" name="Constant_9940" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="200" name="__module.encoder.layers.2.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="266,input.47">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="201" name="__module.encoder.layers.2.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="267,input.49">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="202" name="self.encoder.layers.2.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="39876300" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.2.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="203" name="self.encoder.layers.2.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="204" name="__module.encoder.layers.2.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="205" name="Constant_9941_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="44594892" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="206" name="Constant_9941" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="207" name="__module.encoder.layers.2.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="270,hidden_states.17">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="208" name="__module.encoder.layers.2/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="271,input.51">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="209" name="__module.encoder.layers.3.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="210" name="__module.encoder.layers.3.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="211" name="Constant_9942_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="44596428" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="212" name="Constant_9942" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="213" name="__module.encoder.layers.3.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="214" name="Constant_9943_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="44597964" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="215" name="Constant_9943" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="216" name="__module.encoder.layers.3.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="279,hidden_states.19">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="217" name="self.encoder.layers.3.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="44599500" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.3.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="218" name="self.encoder.layers.3.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="219" name="__module.encoder.layers.3.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="220" name="Constant_9944_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="48138444" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="221" name="Constant_9944" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="222" name="__module.encoder.layers.3.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="288">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="223" name="Constant_10206" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="224" name="__module.encoder.layers.3.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="292">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="225" name="Constant_1198" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="293">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="226" name="__module.encoder.layers.3.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="294,mixed_qkv.7">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="227" name="__module.encoder.layers.3.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="295,query_states.7">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="228" name="__module.encoder.layers.3.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="296,key_states.7">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="229" name="__module.encoder.layers.3.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="297,value_states.7">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="230" name="Constant_9544_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="231" name="Constant_9544" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="232" name="__module.encoder.layers.3.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="303">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="233" name="Constant_1293" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="304">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="234" name="__module.encoder.layers.3.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="305,context_layer.7">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="235" name="__module.encoder.layers.3.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="236" name="__module.encoder.layers.3.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="309,input.57">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="237" name="self.encoder.layers.3.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="48143052" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.3.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="238" name="self.encoder.layers.3.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="239" name="__module.encoder.layers.3.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="240" name="Constant_9945_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="49322700" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="241" name="Constant_9945" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="242" name="__module.encoder.layers.3.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="312,hidden_states.21">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="243" name="__module.encoder.layers.3/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="313,input.59">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="244" name="__module.encoder.layers.3.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="245" name="__module.encoder.layers.3.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="246" name="Constant_9946_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="49324236" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="247" name="Constant_9946" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="248" name="__module.encoder.layers.3.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="249" name="Constant_9947_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="49325772" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="250" name="Constant_9947" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="251" name="__module.encoder.layers.3.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="317,input.61">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="252" name="self.encoder.layers.3.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="49327308" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.3.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="253" name="self.encoder.layers.3.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="254" name="__module.encoder.layers.3.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="255" name="Constant_9948_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="54045900" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="256" name="Constant_9948" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="257" name="__module.encoder.layers.3.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="323,input.63">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="258" name="__module.encoder.layers.3.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="324,input.65">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="259" name="self.encoder.layers.3.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="54052044" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.3.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="260" name="self.encoder.layers.3.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="261" name="__module.encoder.layers.3.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="262" name="Constant_9949_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="58770636" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="263" name="Constant_9949" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="264" name="__module.encoder.layers.3.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="327,hidden_states.23">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="265" name="__module.encoder.layers.3/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="328,input.67">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="266" name="__module.encoder.layers.4.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="267" name="__module.encoder.layers.4.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="268" name="Constant_9950_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="58772172" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="269" name="Constant_9950" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="270" name="__module.encoder.layers.4.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="271" name="Constant_9951_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="58773708" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="272" name="Constant_9951" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="273" name="__module.encoder.layers.4.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="336,hidden_states.25">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="274" name="self.encoder.layers.4.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="58775244" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.4.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="275" name="self.encoder.layers.4.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="276" name="__module.encoder.layers.4.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="277" name="Constant_9952_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="62314188" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="278" name="Constant_9952" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="279" name="__module.encoder.layers.4.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="345">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="280" name="Constant_10207" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="281" name="__module.encoder.layers.4.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="349">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="282" name="Constant_1476" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="350">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="283" name="__module.encoder.layers.4.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="351,mixed_qkv.9">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="284" name="__module.encoder.layers.4.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="352,query_states.9">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="285" name="__module.encoder.layers.4.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="353,key_states.9">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="286" name="__module.encoder.layers.4.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="354,value_states.9">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="287" name="Constant_9560_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="288" name="Constant_9560" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="289" name="__module.encoder.layers.4.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="360">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="290" name="Constant_1571" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="361">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="291" name="__module.encoder.layers.4.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="362,context_layer.9">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="292" name="__module.encoder.layers.4.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="293" name="__module.encoder.layers.4.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="366,input.73">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="294" name="self.encoder.layers.4.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="62318796" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.4.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="295" name="self.encoder.layers.4.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="296" name="__module.encoder.layers.4.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="297" name="Constant_9953_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="63498444" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="298" name="Constant_9953" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="299" name="__module.encoder.layers.4.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="369,hidden_states.27">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="300" name="__module.encoder.layers.4/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="370,input.75">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="301" name="__module.encoder.layers.4.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="302" name="__module.encoder.layers.4.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="303" name="Constant_9954_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="63499980" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="304" name="Constant_9954" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="305" name="__module.encoder.layers.4.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="306" name="Constant_9955_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="63501516" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="307" name="Constant_9955" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="308" name="__module.encoder.layers.4.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="374,input.77">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="309" name="self.encoder.layers.4.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="63503052" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.4.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="310" name="self.encoder.layers.4.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="311" name="__module.encoder.layers.4.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="312" name="Constant_9956_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="68221644" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="313" name="Constant_9956" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="314" name="__module.encoder.layers.4.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="380,input.79">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="315" name="__module.encoder.layers.4.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="381,input.81">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="316" name="self.encoder.layers.4.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="68227788" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.4.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="317" name="self.encoder.layers.4.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="318" name="__module.encoder.layers.4.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="319" name="Constant_9957_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="72946380" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="320" name="Constant_9957" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="321" name="__module.encoder.layers.4.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="384,hidden_states.29">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="322" name="__module.encoder.layers.4/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="385,input.83">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="323" name="__module.encoder.layers.5.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="324" name="__module.encoder.layers.5.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="325" name="Constant_9958_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="72947916" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="326" name="Constant_9958" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="327" name="__module.encoder.layers.5.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="328" name="Constant_9959_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="72949452" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="329" name="Constant_9959" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="330" name="__module.encoder.layers.5.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="393,hidden_states.31">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="331" name="self.encoder.layers.5.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="72950988" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.5.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="332" name="self.encoder.layers.5.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="333" name="__module.encoder.layers.5.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="334" name="Constant_9960_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="76489932" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="335" name="Constant_9960" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="336" name="__module.encoder.layers.5.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="402">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="337" name="Constant_10208" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="338" name="__module.encoder.layers.5.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="406">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="339" name="Constant_1754" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="407">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="340" name="__module.encoder.layers.5.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="408,mixed_qkv.11">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="341" name="__module.encoder.layers.5.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="409,query_states.11">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="342" name="__module.encoder.layers.5.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="410,key_states.11">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="343" name="__module.encoder.layers.5.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="411,value_states.11">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="344" name="Constant_9576_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="345" name="Constant_9576" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="346" name="__module.encoder.layers.5.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="417">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="347" name="Constant_1849" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="418">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="348" name="__module.encoder.layers.5.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="419,context_layer.11">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="349" name="__module.encoder.layers.5.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="350" name="__module.encoder.layers.5.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="423,input.89">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="351" name="self.encoder.layers.5.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="76494540" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.5.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="352" name="self.encoder.layers.5.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="353" name="__module.encoder.layers.5.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="354" name="Constant_9961_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="77674188" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="355" name="Constant_9961" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="356" name="__module.encoder.layers.5.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="426,hidden_states.33">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="357" name="__module.encoder.layers.5/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="427,input.91">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="358" name="__module.encoder.layers.5.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="359" name="__module.encoder.layers.5.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="360" name="Constant_9962_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="77675724" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="361" name="Constant_9962" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="362" name="__module.encoder.layers.5.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="363" name="Constant_9963_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="77677260" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="364" name="Constant_9963" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="365" name="__module.encoder.layers.5.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="431,input.93">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="366" name="self.encoder.layers.5.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="77678796" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.5.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="367" name="self.encoder.layers.5.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="368" name="__module.encoder.layers.5.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="369" name="Constant_9964_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="82397388" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="370" name="Constant_9964" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="371" name="__module.encoder.layers.5.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="437,input.95">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="372" name="__module.encoder.layers.5.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="438,input.97">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="373" name="self.encoder.layers.5.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="82403532" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.5.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="374" name="self.encoder.layers.5.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="375" name="__module.encoder.layers.5.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="376" name="Constant_9965_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="87122124" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="377" name="Constant_9965" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="378" name="__module.encoder.layers.5.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="441,hidden_states.35">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="379" name="__module.encoder.layers.5/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="442,input.99">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="380" name="__module.encoder.layers.6.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="381" name="__module.encoder.layers.6.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="382" name="Constant_9966_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="87123660" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="383" name="Constant_9966" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="384" name="__module.encoder.layers.6.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="385" name="Constant_9967_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="87125196" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="386" name="Constant_9967" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="387" name="__module.encoder.layers.6.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="450,hidden_states.37">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="388" name="self.encoder.layers.6.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="87126732" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.6.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="389" name="self.encoder.layers.6.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="390" name="__module.encoder.layers.6.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="391" name="Constant_9968_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="90665676" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="392" name="Constant_9968" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="393" name="__module.encoder.layers.6.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="459">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="394" name="Constant_10209" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="395" name="__module.encoder.layers.6.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="463">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="396" name="Constant_2032" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="464">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="397" name="__module.encoder.layers.6.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="465,mixed_qkv.13">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="398" name="__module.encoder.layers.6.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="466,query_states.13">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="399" name="__module.encoder.layers.6.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="467,key_states.13">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="400" name="__module.encoder.layers.6.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="468,value_states.13">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="401" name="Constant_9592_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="402" name="Constant_9592" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="403" name="__module.encoder.layers.6.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="474">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="404" name="Constant_2127" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="475">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="405" name="__module.encoder.layers.6.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="476,context_layer.13">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="406" name="__module.encoder.layers.6.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="407" name="__module.encoder.layers.6.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="480,input.105">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="408" name="self.encoder.layers.6.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="90670284" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.6.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="409" name="self.encoder.layers.6.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="410" name="__module.encoder.layers.6.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="411" name="Constant_9969_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="91849932" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="412" name="Constant_9969" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="413" name="__module.encoder.layers.6.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="483,hidden_states.39">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="414" name="__module.encoder.layers.6/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="484,input.107">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="415" name="__module.encoder.layers.6.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="416" name="__module.encoder.layers.6.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="417" name="Constant_9970_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="91851468" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="418" name="Constant_9970" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="419" name="__module.encoder.layers.6.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="420" name="Constant_9971_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="91853004" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="421" name="Constant_9971" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="422" name="__module.encoder.layers.6.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="488,input.109">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="423" name="self.encoder.layers.6.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="91854540" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.6.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="424" name="self.encoder.layers.6.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="425" name="__module.encoder.layers.6.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="426" name="Constant_9972_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="96573132" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="427" name="Constant_9972" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="428" name="__module.encoder.layers.6.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="494,input.111">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="429" name="__module.encoder.layers.6.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="495,input.113">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="430" name="self.encoder.layers.6.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="96579276" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.6.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="431" name="self.encoder.layers.6.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="432" name="__module.encoder.layers.6.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="433" name="Constant_9973_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="101297868" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="434" name="Constant_9973" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="435" name="__module.encoder.layers.6.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="498,hidden_states.41">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="436" name="__module.encoder.layers.6/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="499,input.115">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="437" name="__module.encoder.layers.7.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="438" name="__module.encoder.layers.7.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="439" name="Constant_9974_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="101299404" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="440" name="Constant_9974" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="441" name="__module.encoder.layers.7.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="442" name="Constant_9975_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="101300940" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="443" name="Constant_9975" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="444" name="__module.encoder.layers.7.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="507,hidden_states.43">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="445" name="self.encoder.layers.7.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="101302476" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.7.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="446" name="self.encoder.layers.7.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="447" name="__module.encoder.layers.7.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="448" name="Constant_9976_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="104841420" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="449" name="Constant_9976" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="450" name="__module.encoder.layers.7.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="516">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="451" name="Constant_10210" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="452" name="__module.encoder.layers.7.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="520">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="453" name="Constant_2310" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="521">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="454" name="__module.encoder.layers.7.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="522,mixed_qkv.15">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="455" name="__module.encoder.layers.7.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="523,query_states.15">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="456" name="__module.encoder.layers.7.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="524,key_states.15">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="457" name="__module.encoder.layers.7.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="525,value_states.15">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="458" name="Constant_9608_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="459" name="Constant_9608" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="460" name="__module.encoder.layers.7.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="531">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="461" name="Constant_2405" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="532">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="462" name="__module.encoder.layers.7.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="533,context_layer.15">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="463" name="__module.encoder.layers.7.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="464" name="__module.encoder.layers.7.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="537,input.121">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="465" name="self.encoder.layers.7.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="104846028" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.7.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="466" name="self.encoder.layers.7.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="467" name="__module.encoder.layers.7.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="468" name="Constant_9977_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="106025676" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="469" name="Constant_9977" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="470" name="__module.encoder.layers.7.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="540,hidden_states.45">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="471" name="__module.encoder.layers.7/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="541,input.123">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="472" name="__module.encoder.layers.7.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="473" name="__module.encoder.layers.7.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="474" name="Constant_9978_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="106027212" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="475" name="Constant_9978" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="476" name="__module.encoder.layers.7.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="477" name="Constant_9979_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="106028748" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="478" name="Constant_9979" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="479" name="__module.encoder.layers.7.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="545,input.125">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="480" name="self.encoder.layers.7.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="106030284" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.7.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="481" name="self.encoder.layers.7.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="482" name="__module.encoder.layers.7.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="483" name="Constant_9980_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="110748876" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="484" name="Constant_9980" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="485" name="__module.encoder.layers.7.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="551,input.127">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="486" name="__module.encoder.layers.7.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="552,input.129">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="487" name="self.encoder.layers.7.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="110755020" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.7.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="488" name="self.encoder.layers.7.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="489" name="__module.encoder.layers.7.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="490" name="Constant_9981_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="115473612" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="491" name="Constant_9981" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="492" name="__module.encoder.layers.7.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="555,hidden_states.47">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="493" name="__module.encoder.layers.7/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="556,input.131">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="494" name="__module.encoder.layers.8.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="495" name="__module.encoder.layers.8.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="496" name="Constant_9982_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="115475148" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="497" name="Constant_9982" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="498" name="__module.encoder.layers.8.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="499" name="Constant_9983_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="115476684" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="500" name="Constant_9983" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="501" name="__module.encoder.layers.8.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="564,hidden_states.49">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="502" name="self.encoder.layers.8.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="115478220" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.8.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="503" name="self.encoder.layers.8.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="504" name="__module.encoder.layers.8.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="505" name="Constant_9984_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="119017164" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="506" name="Constant_9984" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="507" name="__module.encoder.layers.8.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="573">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="508" name="Constant_10211" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="509" name="__module.encoder.layers.8.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="577">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="510" name="Constant_2588" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="578">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="511" name="__module.encoder.layers.8.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="579,mixed_qkv.17">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="512" name="__module.encoder.layers.8.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="580,query_states.17">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="513" name="__module.encoder.layers.8.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="581,key_states.17">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="514" name="__module.encoder.layers.8.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="582,value_states.17">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="515" name="Constant_9624_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="516" name="Constant_9624" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="517" name="__module.encoder.layers.8.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="588">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="518" name="Constant_2683" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="589">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="519" name="__module.encoder.layers.8.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="590,context_layer.17">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="520" name="__module.encoder.layers.8.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="521" name="__module.encoder.layers.8.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="594,input.137">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="522" name="self.encoder.layers.8.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="119021772" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.8.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="523" name="self.encoder.layers.8.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="524" name="__module.encoder.layers.8.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="525" name="Constant_9985_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="120201420" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="526" name="Constant_9985" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="527" name="__module.encoder.layers.8.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="597,hidden_states.51">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="528" name="__module.encoder.layers.8/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="598,input.139">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="529" name="__module.encoder.layers.8.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="530" name="__module.encoder.layers.8.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="531" name="Constant_9986_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="120202956" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="532" name="Constant_9986" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="533" name="__module.encoder.layers.8.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="534" name="Constant_9987_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="120204492" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="535" name="Constant_9987" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="536" name="__module.encoder.layers.8.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="602,input.141">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="537" name="self.encoder.layers.8.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="120206028" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.8.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="538" name="self.encoder.layers.8.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="539" name="__module.encoder.layers.8.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="540" name="Constant_9988_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="124924620" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="541" name="Constant_9988" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="542" name="__module.encoder.layers.8.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="608,input.143">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="543" name="__module.encoder.layers.8.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="609,input.145">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="544" name="self.encoder.layers.8.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="124930764" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.8.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="545" name="self.encoder.layers.8.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="546" name="__module.encoder.layers.8.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="547" name="Constant_9989_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="129649356" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="548" name="Constant_9989" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="549" name="__module.encoder.layers.8.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="612,hidden_states.53">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="550" name="__module.encoder.layers.8/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="613,input.147">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="551" name="__module.encoder.layers.9.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="552" name="__module.encoder.layers.9.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="553" name="Constant_9990_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="129650892" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="554" name="Constant_9990" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="555" name="__module.encoder.layers.9.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="556" name="Constant_9991_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="129652428" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="557" name="Constant_9991" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="558" name="__module.encoder.layers.9.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="621,hidden_states.55">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="559" name="self.encoder.layers.9.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="129653964" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.9.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="560" name="self.encoder.layers.9.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="561" name="__module.encoder.layers.9.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="562" name="Constant_9992_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="133192908" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="563" name="Constant_9992" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="564" name="__module.encoder.layers.9.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="630">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="565" name="Constant_10212" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="566" name="__module.encoder.layers.9.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="634">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="567" name="Constant_2866" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="635">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="568" name="__module.encoder.layers.9.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="636,mixed_qkv.19">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="569" name="__module.encoder.layers.9.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="637,query_states.19">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="570" name="__module.encoder.layers.9.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="638,key_states.19">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="571" name="__module.encoder.layers.9.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="639,value_states.19">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="572" name="Constant_9640_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="573" name="Constant_9640" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="574" name="__module.encoder.layers.9.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="645">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="575" name="Constant_2961" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="646">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="576" name="__module.encoder.layers.9.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="647,context_layer.19">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="577" name="__module.encoder.layers.9.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="578" name="__module.encoder.layers.9.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="651,input.153">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="579" name="self.encoder.layers.9.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="133197516" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.9.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="580" name="self.encoder.layers.9.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="581" name="__module.encoder.layers.9.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="582" name="Constant_9993_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="134377164" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="583" name="Constant_9993" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="584" name="__module.encoder.layers.9.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="654,hidden_states.57">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="585" name="__module.encoder.layers.9/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="655,input.155">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="586" name="__module.encoder.layers.9.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="587" name="__module.encoder.layers.9.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="588" name="Constant_9994_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="134378700" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="589" name="Constant_9994" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="590" name="__module.encoder.layers.9.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="591" name="Constant_9995_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="134380236" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="592" name="Constant_9995" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="593" name="__module.encoder.layers.9.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="659,input.157">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="594" name="self.encoder.layers.9.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="134381772" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.9.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="595" name="self.encoder.layers.9.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="596" name="__module.encoder.layers.9.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="597" name="Constant_9996_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="139100364" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="598" name="Constant_9996" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="599" name="__module.encoder.layers.9.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="665,input.159">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="600" name="__module.encoder.layers.9.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="666,input.161">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="601" name="self.encoder.layers.9.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="139106508" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.9.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="602" name="self.encoder.layers.9.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="603" name="__module.encoder.layers.9.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="604" name="Constant_9997_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="143825100" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="605" name="Constant_9997" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="606" name="__module.encoder.layers.9.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="669,hidden_states.59">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="607" name="__module.encoder.layers.9/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="670,input.163">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="608" name="__module.encoder.layers.10.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="609" name="__module.encoder.layers.10.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="610" name="Constant_9998_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="143826636" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="611" name="Constant_9998" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="612" name="__module.encoder.layers.10.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="613" name="Constant_9999_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="143828172" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="614" name="Constant_9999" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="615" name="__module.encoder.layers.10.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="678,hidden_states.61">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="616" name="self.encoder.layers.10.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="143829708" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.10.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="617" name="self.encoder.layers.10.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="618" name="__module.encoder.layers.10.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="619" name="Constant_10000_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="147368652" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="620" name="Constant_10000" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="621" name="__module.encoder.layers.10.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="687">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="622" name="Constant_10213" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="623" name="__module.encoder.layers.10.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="691">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="624" name="Constant_3144" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="692">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="625" name="__module.encoder.layers.10.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="693,mixed_qkv.21">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="626" name="__module.encoder.layers.10.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="694,query_states.21">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="627" name="__module.encoder.layers.10.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="695,key_states.21">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="628" name="__module.encoder.layers.10.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="696,value_states.21">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="629" name="Constant_9656_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="630" name="Constant_9656" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="631" name="__module.encoder.layers.10.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="702">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="632" name="Constant_3239" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="703">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="633" name="__module.encoder.layers.10.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="704,context_layer.21">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="634" name="__module.encoder.layers.10.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="635" name="__module.encoder.layers.10.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="708,input.169">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="636" name="self.encoder.layers.10.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="147373260" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.10.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="637" name="self.encoder.layers.10.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="638" name="__module.encoder.layers.10.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="639" name="Constant_10001_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="148552908" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="640" name="Constant_10001" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="641" name="__module.encoder.layers.10.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="711,hidden_states.63">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="642" name="__module.encoder.layers.10/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="712,input.171">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="643" name="__module.encoder.layers.10.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="644" name="__module.encoder.layers.10.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="645" name="Constant_10002_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="148554444" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="646" name="Constant_10002" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="647" name="__module.encoder.layers.10.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="648" name="Constant_10003_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="148555980" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="649" name="Constant_10003" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="650" name="__module.encoder.layers.10.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="716,input.173">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="651" name="self.encoder.layers.10.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="148557516" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.10.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="652" name="self.encoder.layers.10.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="653" name="__module.encoder.layers.10.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="654" name="Constant_10004_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="153276108" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="655" name="Constant_10004" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="656" name="__module.encoder.layers.10.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="722,input.175">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="657" name="__module.encoder.layers.10.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="723,input.177">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="658" name="self.encoder.layers.10.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="153282252" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.10.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="659" name="self.encoder.layers.10.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="660" name="__module.encoder.layers.10.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="661" name="Constant_10005_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="158000844" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="662" name="Constant_10005" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="663" name="__module.encoder.layers.10.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="726,hidden_states.65">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="664" name="__module.encoder.layers.10/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="727,input.179">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="665" name="__module.encoder.layers.11.layer_norm1/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="666" name="__module.encoder.layers.11.layer_norm1/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="667" name="Constant_10006_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="158002380" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="668" name="Constant_10006" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="669" name="__module.encoder.layers.11.layer_norm1/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="670" name="Constant_10007_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="158003916" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="671" name="Constant_10007" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="672" name="__module.encoder.layers.11.layer_norm1/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="735,hidden_states.67">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="673" name="self.encoder.layers.11.self_attn.qkv.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="2304, 768" offset="158005452" size="3538944" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.11.self_attn.qkv.weight">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="674" name="self.encoder.layers.11.self_attn.qkv.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="675" name="__module.encoder.layers.11.self_attn.qkv/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>2304</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="676" name="Constant_10008_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 2304" offset="161544396" size="4608" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="677" name="Constant_10008" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="678" name="__module.encoder.layers.11.self_attn.qkv/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="744">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="679" name="Constant_10214" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615672" size="40" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="680" name="__module.encoder.layers.11.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>2304</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="748">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="681" name="Constant_3422" type="Const" version="opset1">
|
| <data element_type="i64" shape="5" offset="5615712" size="40" />
|
| <output>
|
| <port id="0" precision="I64" names="749">
|
| <dim>5</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="682" name="__module.encoder.layers.11.self_attn/aten::permute/Transpose" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>5</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="750,mixed_qkv">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="683" name="__module.encoder.layers.11.self_attn/aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="751,query_states">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="684" name="__module.encoder.layers.11.self_attn/aten::select/Gather_1" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="752,key_states">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="685" name="__module.encoder.layers.11.self_attn/aten::select/Gather_2" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>3</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="753,value_states">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="686" name="Constant_9672_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="" offset="5615760" size="2" />
|
| <output>
|
| <port id="0" precision="FP16" />
|
| </output>
|
| </layer>
|
| <layer id="687" name="Constant_9672" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16" />
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" />
|
| </output>
|
| </layer>
|
| <layer id="688" name="__module.encoder.layers.11.self_attn/aten::matmul/MatMul_1" type="ScaledDotProductAttention" version="opset13">
|
| <data causal="false" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="3" precision="FP32" />
|
| <port id="4" precision="FP32" />
|
| </input>
|
| <output>
|
| <port id="5" precision="FP32" names="759">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="689" name="Constant_3517" type="Const" version="opset1">
|
| <data element_type="i64" shape="4" offset="5615764" size="32" />
|
| <output>
|
| <port id="0" precision="I64" names="760">
|
| <dim>4</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="690" name="__module.encoder.layers.11.self_attn/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>-1</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>4</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="761,context_layer">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="691" name="__module.encoder.layers.11.self_attn/prim::ListConstruct_1" type="Const" version="opset1">
|
| <data element_type="i64" shape="3" offset="5615796" size="24" />
|
| <rt_info>
|
| <attribute name="precise" version="0" />
|
| </rt_info>
|
| <output>
|
| <port id="0" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="692" name="__module.encoder.layers.11.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1">
|
| <data special_zero="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>12</dim>
|
| <dim>64</dim>
|
| </port>
|
| <port id="1" precision="I64">
|
| <dim>3</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="765,input.185">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="693" name="self.encoder.layers.11.self_attn.projection.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 768" offset="161549004" size="1179648" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.11.self_attn.projection.weight">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="694" name="self.encoder.layers.11.self_attn.projection.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="695" name="__module.encoder.layers.11.self_attn.projection/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="696" name="Constant_10009_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="162728652" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="697" name="Constant_10009" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="698" name="__module.encoder.layers.11.self_attn.projection/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="768,hidden_states.69">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="699" name="__module.encoder.layers.11/aten::add/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="769,input.187">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="700" name="__module.encoder.layers.11.layer_norm2/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="701" name="__module.encoder.layers.11.layer_norm2/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="702" name="Constant_10010_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="162730188" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="703" name="Constant_10010" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="704" name="__module.encoder.layers.11.layer_norm2/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="705" name="Constant_10011_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="162731724" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="706" name="Constant_10011" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="707" name="__module.encoder.layers.11.layer_norm2/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="773,input.189">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="708" name="self.encoder.layers.11.mlp.fc1.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="3072, 768" offset="162733260" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.11.mlp.fc1.weight">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="709" name="self.encoder.layers.11.mlp.fc1.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="710" name="__module.encoder.layers.11.mlp.fc1/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>3072</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="711" name="Constant_10012_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 3072" offset="167451852" size="6144" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="712" name="Constant_10012" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="713" name="__module.encoder.layers.11.mlp.fc1/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="779,input.191">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="714" name="__module.encoder.layers.11.mlp.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
| <data approximation_mode="ERF" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32" names="780,input.193">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="715" name="self.encoder.layers.11.mlp.fc2.weight_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="768, 3072" offset="167457996" size="4718592" />
|
| <output>
|
| <port id="0" precision="FP16" names="self.encoder.layers.11.mlp.fc2.weight">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="716" name="self.encoder.layers.11.mlp.fc2.weight" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="717" name="__module.encoder.layers.11.mlp.fc2/aten::linear/MatMul" type="MatMul" version="opset1">
|
| <data transpose_a="false" transpose_b="true" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>3072</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>768</dim>
|
| <dim>3072</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="718" name="Constant_10013_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="172176588" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="719" name="Constant_10013" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="720" name="__module.encoder.layers.11.mlp.fc2/aten::linear/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="783,hidden_states">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="721" name="__module.encoder.layers.11/aten::add/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="784,input.195">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="722" name="__module.post_layernorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="723" name="__module.post_layernorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="724" name="Constant_10014_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="172178124" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="725" name="Constant_10014" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="726" name="__module.post_layernorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="727" name="Constant_10015_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 1, 768" offset="172179660" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="728" name="Constant_10015" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="729" name="__module.post_layernorm/aten::layer_norm/Add" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="12,last_hidden_state">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="730" name="14" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="1182720" size="8" />
|
| <output>
|
| <port id="0" precision="I64" names="14" />
|
| </output>
|
| </layer>
|
| <layer id="731" name="13" type="Const" version="opset1">
|
| <data element_type="i64" shape="" offset="1182728" size="8" />
|
| <output>
|
| <port id="0" precision="I64" names="13" />
|
| </output>
|
| </layer>
|
| <layer id="732" name="aten::select/Gather" type="Gather" version="opset8">
|
| <data batch_dims="0" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I64" />
|
| <port id="2" precision="I64" />
|
| </input>
|
| <output>
|
| <port id="3" precision="FP32" names="15,20,input">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="733" name="__module.post_layernorm/aten::layer_norm/Multiply_2" type="Const" version="opset1">
|
| <data element_type="i32" shape="1" offset="2069044" size="4" />
|
| <output>
|
| <port id="0" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="734" name="__module.post_layernorm/aten::layer_norm/MVN_1" type="MVN" version="opset6">
|
| <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="I32">
|
| <dim>1</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="735" name="Constant_10016_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 768" offset="172178124" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="736" name="Constant_10016" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="737" name="__module.post_layernorm/aten::layer_norm/Multiply_3" type="Multiply" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="738" name="Constant_10017_compressed" type="Const" version="opset1">
|
| <data element_type="f16" shape="1, 768" offset="172179660" size="1536" />
|
| <output>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="739" name="Constant_10017" type="Convert" version="opset1">
|
| <data destination_type="f32" />
|
| <rt_info>
|
| <attribute name="decompression" version="0" />
|
| </rt_info>
|
| <input>
|
| <port id="0" precision="FP16">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="740" name="__module.post_layernorm/aten::layer_norm/Add_1" type="Add" version="opset1">
|
| <data auto_broadcast="numpy" />
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| <port id="1" precision="FP32">
|
| <dim>1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| <output>
|
| <port id="2" precision="FP32" names="pooler_output">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </output>
|
| </layer>
|
| <layer id="742" name="Result_3716" type="Result" version="opset1" output_names="12,last_hidden_state">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| </layer>
|
| <layer id="741" name="Result_3717" type="Result" version="opset1" output_names="pooler_output">
|
| <input>
|
| <port id="0" precision="FP32">
|
| <dim>-1</dim>
|
| <dim>768</dim>
|
| </port>
|
| </input>
|
| </layer>
|
| </layers>
|
| <edges>
|
| <edge from-layer="0" from-port="0" to-layer="5" to-port="0" />
|
| <edge from-layer="1" from-port="0" to-layer="2" to-port="0" />
|
| <edge from-layer="2" from-port="1" to-layer="16" to-port="0" />
|
| <edge from-layer="3" from-port="0" to-layer="4" to-port="0" />
|
| <edge from-layer="4" from-port="1" to-layer="5" to-port="1" />
|
| <edge from-layer="5" from-port="2" to-layer="8" to-port="0" />
|
| <edge from-layer="6" from-port="0" to-layer="7" to-port="0" />
|
| <edge from-layer="7" from-port="1" to-layer="8" to-port="1" />
|
| <edge from-layer="8" from-port="2" to-layer="9" to-port="0" />
|
| <edge from-layer="8" from-port="2" to-layer="18" to-port="0" />
|
| <edge from-layer="9" from-port="1" to-layer="12" to-port="0" />
|
| <edge from-layer="10" from-port="0" to-layer="12" to-port="1" />
|
| <edge from-layer="11" from-port="0" to-layer="12" to-port="2" />
|
| <edge from-layer="12" from-port="3" to-layer="15" to-port="0" />
|
| <edge from-layer="13" from-port="0" to-layer="15" to-port="1" />
|
| <edge from-layer="14" from-port="0" to-layer="15" to-port="2" />
|
| <edge from-layer="15" from-port="3" to-layer="16" to-port="1" />
|
| <edge from-layer="16" from-port="2" to-layer="21" to-port="0" />
|
| <edge from-layer="17" from-port="0" to-layer="18" to-port="1" />
|
| <edge from-layer="18" from-port="2" to-layer="20" to-port="0" />
|
| <edge from-layer="19" from-port="0" to-layer="20" to-port="1" />
|
| <edge from-layer="20" from-port="2" to-layer="21" to-port="1" />
|
| <edge from-layer="21" from-port="2" to-layer="25" to-port="0" />
|
| <edge from-layer="21" from-port="2" to-layer="32" to-port="0" />
|
| <edge from-layer="22" from-port="0" to-layer="23" to-port="0" />
|
| <edge from-layer="23" from-port="1" to-layer="31" to-port="0" />
|
| <edge from-layer="24" from-port="0" to-layer="31" to-port="1" />
|
| <edge from-layer="25" from-port="1" to-layer="28" to-port="0" />
|
| <edge from-layer="26" from-port="0" to-layer="28" to-port="1" />
|
| <edge from-layer="27" from-port="0" to-layer="28" to-port="2" />
|
| <edge from-layer="28" from-port="3" to-layer="31" to-port="2" />
|
| <edge from-layer="29" from-port="0" to-layer="31" to-port="3" />
|
| <edge from-layer="30" from-port="0" to-layer="31" to-port="4" />
|
| <edge from-layer="31" from-port="5" to-layer="32" to-port="1" />
|
| <edge from-layer="32" from-port="2" to-layer="34" to-port="0" />
|
| <edge from-layer="32" from-port="2" to-layer="72" to-port="1" />
|
| <edge from-layer="33" from-port="0" to-layer="34" to-port="1" />
|
| <edge from-layer="34" from-port="2" to-layer="37" to-port="0" />
|
| <edge from-layer="35" from-port="0" to-layer="36" to-port="0" />
|
| <edge from-layer="36" from-port="1" to-layer="37" to-port="1" />
|
| <edge from-layer="37" from-port="2" to-layer="40" to-port="0" />
|
| <edge from-layer="38" from-port="0" to-layer="39" to-port="0" />
|
| <edge from-layer="39" from-port="1" to-layer="40" to-port="1" />
|
| <edge from-layer="40" from-port="2" to-layer="43" to-port="0" />
|
| <edge from-layer="41" from-port="0" to-layer="42" to-port="0" />
|
| <edge from-layer="42" from-port="1" to-layer="43" to-port="1" />
|
| <edge from-layer="43" from-port="2" to-layer="46" to-port="0" />
|
| <edge from-layer="44" from-port="0" to-layer="45" to-port="0" />
|
| <edge from-layer="45" from-port="1" to-layer="46" to-port="1" />
|
| <edge from-layer="46" from-port="2" to-layer="48" to-port="0" />
|
| <edge from-layer="47" from-port="0" to-layer="48" to-port="1" />
|
| <edge from-layer="48" from-port="2" to-layer="50" to-port="0" />
|
| <edge from-layer="49" from-port="0" to-layer="50" to-port="1" />
|
| <edge from-layer="50" from-port="2" to-layer="52" to-port="0" />
|
| <edge from-layer="50" from-port="2" to-layer="56" to-port="0" />
|
| <edge from-layer="50" from-port="2" to-layer="54" to-port="0" />
|
| <edge from-layer="51" from-port="0" to-layer="52" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="52" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="683" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="54" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="683" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="56" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="684" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="685" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="170" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="170" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="171" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="172" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="399" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="227" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="227" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="228" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="229" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="284" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="284" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="285" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="286" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="341" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="113" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="113" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="341" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="342" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="114" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="343" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="398" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="115" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="398" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="400" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="455" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="455" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="456" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="457" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="512" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="512" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="513" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="514" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="569" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="569" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="570" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="571" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="626" to-port="1" />
|
| <edge from-layer="51" from-port="0" to-layer="626" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="627" to-port="2" />
|
| <edge from-layer="51" from-port="0" to-layer="628" to-port="2" />
|
| <edge from-layer="52" from-port="3" to-layer="61" to-port="0" />
|
| <edge from-layer="53" from-port="0" to-layer="54" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="342" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="513" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="399" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="456" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="570" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="171" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="627" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="684" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="114" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="228" to-port="1" />
|
| <edge from-layer="53" from-port="0" to-layer="285" to-port="1" />
|
| <edge from-layer="54" from-port="3" to-layer="61" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="56" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="343" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="286" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="172" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="685" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="457" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="115" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="229" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="628" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="571" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="514" to-port="1" />
|
| <edge from-layer="55" from-port="0" to-layer="400" to-port="1" />
|
| <edge from-layer="56" from-port="3" to-layer="61" to-port="2" />
|
| <edge from-layer="57" from-port="0" to-layer="58" to-port="0" />
|
| <edge from-layer="58" from-port="1" to-layer="61" to-port="3" />
|
| <edge from-layer="59" from-port="0" to-layer="60" to-port="0" />
|
| <edge from-layer="60" from-port="1" to-layer="61" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="118" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="631" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="289" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="574" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="232" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="517" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="688" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="460" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="403" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="346" to-port="4" />
|
| <edge from-layer="60" from-port="1" to-layer="175" to-port="4" />
|
| <edge from-layer="61" from-port="5" to-layer="63" to-port="0" />
|
| <edge from-layer="62" from-port="0" to-layer="63" to-port="1" />
|
| <edge from-layer="63" from-port="2" to-layer="65" to-port="0" />
|
| <edge from-layer="64" from-port="0" to-layer="65" to-port="1" />
|
| <edge from-layer="65" from-port="2" to-layer="68" to-port="0" />
|
| <edge from-layer="66" from-port="0" to-layer="67" to-port="0" />
|
| <edge from-layer="67" from-port="1" to-layer="68" to-port="1" />
|
| <edge from-layer="68" from-port="2" to-layer="71" to-port="0" />
|
| <edge from-layer="69" from-port="0" to-layer="70" to-port="0" />
|
| <edge from-layer="70" from-port="1" to-layer="71" to-port="1" />
|
| <edge from-layer="71" from-port="2" to-layer="72" to-port="0" />
|
| <edge from-layer="72" from-port="2" to-layer="74" to-port="0" />
|
| <edge from-layer="72" from-port="2" to-layer="94" to-port="1" />
|
| <edge from-layer="73" from-port="0" to-layer="74" to-port="1" />
|
| <edge from-layer="74" from-port="2" to-layer="77" to-port="0" />
|
| <edge from-layer="75" from-port="0" to-layer="76" to-port="0" />
|
| <edge from-layer="76" from-port="1" to-layer="77" to-port="1" />
|
| <edge from-layer="77" from-port="2" to-layer="80" to-port="0" />
|
| <edge from-layer="78" from-port="0" to-layer="79" to-port="0" />
|
| <edge from-layer="79" from-port="1" to-layer="80" to-port="1" />
|
| <edge from-layer="80" from-port="2" to-layer="83" to-port="0" />
|
| <edge from-layer="81" from-port="0" to-layer="82" to-port="0" />
|
| <edge from-layer="82" from-port="1" to-layer="83" to-port="1" />
|
| <edge from-layer="83" from-port="2" to-layer="86" to-port="0" />
|
| <edge from-layer="84" from-port="0" to-layer="85" to-port="0" />
|
| <edge from-layer="85" from-port="1" to-layer="86" to-port="1" />
|
| <edge from-layer="86" from-port="2" to-layer="87" to-port="0" />
|
| <edge from-layer="87" from-port="1" to-layer="90" to-port="0" />
|
| <edge from-layer="88" from-port="0" to-layer="89" to-port="0" />
|
| <edge from-layer="89" from-port="1" to-layer="90" to-port="1" />
|
| <edge from-layer="90" from-port="2" to-layer="93" to-port="0" />
|
| <edge from-layer="91" from-port="0" to-layer="92" to-port="0" />
|
| <edge from-layer="92" from-port="1" to-layer="93" to-port="1" />
|
| <edge from-layer="93" from-port="2" to-layer="94" to-port="0" />
|
| <edge from-layer="94" from-port="2" to-layer="96" to-port="0" />
|
| <edge from-layer="94" from-port="2" to-layer="129" to-port="1" />
|
| <edge from-layer="95" from-port="0" to-layer="96" to-port="1" />
|
| <edge from-layer="96" from-port="2" to-layer="99" to-port="0" />
|
| <edge from-layer="97" from-port="0" to-layer="98" to-port="0" />
|
| <edge from-layer="98" from-port="1" to-layer="99" to-port="1" />
|
| <edge from-layer="99" from-port="2" to-layer="102" to-port="0" />
|
| <edge from-layer="100" from-port="0" to-layer="101" to-port="0" />
|
| <edge from-layer="101" from-port="1" to-layer="102" to-port="1" />
|
| <edge from-layer="102" from-port="2" to-layer="105" to-port="0" />
|
| <edge from-layer="103" from-port="0" to-layer="104" to-port="0" />
|
| <edge from-layer="104" from-port="1" to-layer="105" to-port="1" />
|
| <edge from-layer="105" from-port="2" to-layer="108" to-port="0" />
|
| <edge from-layer="106" from-port="0" to-layer="107" to-port="0" />
|
| <edge from-layer="107" from-port="1" to-layer="108" to-port="1" />
|
| <edge from-layer="108" from-port="2" to-layer="110" to-port="0" />
|
| <edge from-layer="109" from-port="0" to-layer="110" to-port="1" />
|
| <edge from-layer="110" from-port="2" to-layer="112" to-port="0" />
|
| <edge from-layer="111" from-port="0" to-layer="112" to-port="1" />
|
| <edge from-layer="112" from-port="2" to-layer="113" to-port="0" />
|
| <edge from-layer="112" from-port="2" to-layer="114" to-port="0" />
|
| <edge from-layer="112" from-port="2" to-layer="115" to-port="0" />
|
| <edge from-layer="113" from-port="3" to-layer="118" to-port="0" />
|
| <edge from-layer="114" from-port="3" to-layer="118" to-port="1" />
|
| <edge from-layer="115" from-port="3" to-layer="118" to-port="2" />
|
| <edge from-layer="116" from-port="0" to-layer="117" to-port="0" />
|
| <edge from-layer="117" from-port="1" to-layer="118" to-port="3" />
|
| <edge from-layer="118" from-port="5" to-layer="120" to-port="0" />
|
| <edge from-layer="119" from-port="0" to-layer="120" to-port="1" />
|
| <edge from-layer="120" from-port="2" to-layer="122" to-port="0" />
|
| <edge from-layer="121" from-port="0" to-layer="122" to-port="1" />
|
| <edge from-layer="122" from-port="2" to-layer="125" to-port="0" />
|
| <edge from-layer="123" from-port="0" to-layer="124" to-port="0" />
|
| <edge from-layer="124" from-port="1" to-layer="125" to-port="1" />
|
| <edge from-layer="125" from-port="2" to-layer="128" to-port="0" />
|
| <edge from-layer="126" from-port="0" to-layer="127" to-port="0" />
|
| <edge from-layer="127" from-port="1" to-layer="128" to-port="1" />
|
| <edge from-layer="128" from-port="2" to-layer="129" to-port="0" />
|
| <edge from-layer="129" from-port="2" to-layer="131" to-port="0" />
|
| <edge from-layer="129" from-port="2" to-layer="151" to-port="1" />
|
| <edge from-layer="130" from-port="0" to-layer="131" to-port="1" />
|
| <edge from-layer="131" from-port="2" to-layer="134" to-port="0" />
|
| <edge from-layer="132" from-port="0" to-layer="133" to-port="0" />
|
| <edge from-layer="133" from-port="1" to-layer="134" to-port="1" />
|
| <edge from-layer="134" from-port="2" to-layer="137" to-port="0" />
|
| <edge from-layer="135" from-port="0" to-layer="136" to-port="0" />
|
| <edge from-layer="136" from-port="1" to-layer="137" to-port="1" />
|
| <edge from-layer="137" from-port="2" to-layer="140" to-port="0" />
|
| <edge from-layer="138" from-port="0" to-layer="139" to-port="0" />
|
| <edge from-layer="139" from-port="1" to-layer="140" to-port="1" />
|
| <edge from-layer="140" from-port="2" to-layer="143" to-port="0" />
|
| <edge from-layer="141" from-port="0" to-layer="142" to-port="0" />
|
| <edge from-layer="142" from-port="1" to-layer="143" to-port="1" />
|
| <edge from-layer="143" from-port="2" to-layer="144" to-port="0" />
|
| <edge from-layer="144" from-port="1" to-layer="147" to-port="0" />
|
| <edge from-layer="145" from-port="0" to-layer="146" to-port="0" />
|
| <edge from-layer="146" from-port="1" to-layer="147" to-port="1" />
|
| <edge from-layer="147" from-port="2" to-layer="150" to-port="0" />
|
| <edge from-layer="148" from-port="0" to-layer="149" to-port="0" />
|
| <edge from-layer="149" from-port="1" to-layer="150" to-port="1" />
|
| <edge from-layer="150" from-port="2" to-layer="151" to-port="0" />
|
| <edge from-layer="151" from-port="2" to-layer="186" to-port="1" />
|
| <edge from-layer="151" from-port="2" to-layer="153" to-port="0" />
|
| <edge from-layer="152" from-port="0" to-layer="153" to-port="1" />
|
| <edge from-layer="153" from-port="2" to-layer="156" to-port="0" />
|
| <edge from-layer="154" from-port="0" to-layer="155" to-port="0" />
|
| <edge from-layer="155" from-port="1" to-layer="156" to-port="1" />
|
| <edge from-layer="156" from-port="2" to-layer="159" to-port="0" />
|
| <edge from-layer="157" from-port="0" to-layer="158" to-port="0" />
|
| <edge from-layer="158" from-port="1" to-layer="159" to-port="1" />
|
| <edge from-layer="159" from-port="2" to-layer="162" to-port="0" />
|
| <edge from-layer="160" from-port="0" to-layer="161" to-port="0" />
|
| <edge from-layer="161" from-port="1" to-layer="162" to-port="1" />
|
| <edge from-layer="162" from-port="2" to-layer="165" to-port="0" />
|
| <edge from-layer="163" from-port="0" to-layer="164" to-port="0" />
|
| <edge from-layer="164" from-port="1" to-layer="165" to-port="1" />
|
| <edge from-layer="165" from-port="2" to-layer="167" to-port="0" />
|
| <edge from-layer="166" from-port="0" to-layer="167" to-port="1" />
|
| <edge from-layer="167" from-port="2" to-layer="169" to-port="0" />
|
| <edge from-layer="168" from-port="0" to-layer="169" to-port="1" />
|
| <edge from-layer="169" from-port="2" to-layer="172" to-port="0" />
|
| <edge from-layer="169" from-port="2" to-layer="171" to-port="0" />
|
| <edge from-layer="169" from-port="2" to-layer="170" to-port="0" />
|
| <edge from-layer="170" from-port="3" to-layer="175" to-port="0" />
|
| <edge from-layer="171" from-port="3" to-layer="175" to-port="1" />
|
| <edge from-layer="172" from-port="3" to-layer="175" to-port="2" />
|
| <edge from-layer="173" from-port="0" to-layer="174" to-port="0" />
|
| <edge from-layer="174" from-port="1" to-layer="175" to-port="3" />
|
| <edge from-layer="175" from-port="5" to-layer="177" to-port="0" />
|
| <edge from-layer="176" from-port="0" to-layer="177" to-port="1" />
|
| <edge from-layer="177" from-port="2" to-layer="179" to-port="0" />
|
| <edge from-layer="178" from-port="0" to-layer="179" to-port="1" />
|
| <edge from-layer="179" from-port="2" to-layer="182" to-port="0" />
|
| <edge from-layer="180" from-port="0" to-layer="181" to-port="0" />
|
| <edge from-layer="181" from-port="1" to-layer="182" to-port="1" />
|
| <edge from-layer="182" from-port="2" to-layer="185" to-port="0" />
|
| <edge from-layer="183" from-port="0" to-layer="184" to-port="0" />
|
| <edge from-layer="184" from-port="1" to-layer="185" to-port="1" />
|
| <edge from-layer="185" from-port="2" to-layer="186" to-port="0" />
|
| <edge from-layer="186" from-port="2" to-layer="188" to-port="0" />
|
| <edge from-layer="186" from-port="2" to-layer="208" to-port="1" />
|
| <edge from-layer="187" from-port="0" to-layer="188" to-port="1" />
|
| <edge from-layer="188" from-port="2" to-layer="191" to-port="0" />
|
| <edge from-layer="189" from-port="0" to-layer="190" to-port="0" />
|
| <edge from-layer="190" from-port="1" to-layer="191" to-port="1" />
|
| <edge from-layer="191" from-port="2" to-layer="194" to-port="0" />
|
| <edge from-layer="192" from-port="0" to-layer="193" to-port="0" />
|
| <edge from-layer="193" from-port="1" to-layer="194" to-port="1" />
|
| <edge from-layer="194" from-port="2" to-layer="197" to-port="0" />
|
| <edge from-layer="195" from-port="0" to-layer="196" to-port="0" />
|
| <edge from-layer="196" from-port="1" to-layer="197" to-port="1" />
|
| <edge from-layer="197" from-port="2" to-layer="200" to-port="0" />
|
| <edge from-layer="198" from-port="0" to-layer="199" to-port="0" />
|
| <edge from-layer="199" from-port="1" to-layer="200" to-port="1" />
|
| <edge from-layer="200" from-port="2" to-layer="201" to-port="0" />
|
| <edge from-layer="201" from-port="1" to-layer="204" to-port="0" />
|
| <edge from-layer="202" from-port="0" to-layer="203" to-port="0" />
|
| <edge from-layer="203" from-port="1" to-layer="204" to-port="1" />
|
| <edge from-layer="204" from-port="2" to-layer="207" to-port="0" />
|
| <edge from-layer="205" from-port="0" to-layer="206" to-port="0" />
|
| <edge from-layer="206" from-port="1" to-layer="207" to-port="1" />
|
| <edge from-layer="207" from-port="2" to-layer="208" to-port="0" />
|
| <edge from-layer="208" from-port="2" to-layer="210" to-port="0" />
|
| <edge from-layer="208" from-port="2" to-layer="243" to-port="1" />
|
| <edge from-layer="209" from-port="0" to-layer="210" to-port="1" />
|
| <edge from-layer="210" from-port="2" to-layer="213" to-port="0" />
|
| <edge from-layer="211" from-port="0" to-layer="212" to-port="0" />
|
| <edge from-layer="212" from-port="1" to-layer="213" to-port="1" />
|
| <edge from-layer="213" from-port="2" to-layer="216" to-port="0" />
|
| <edge from-layer="214" from-port="0" to-layer="215" to-port="0" />
|
| <edge from-layer="215" from-port="1" to-layer="216" to-port="1" />
|
| <edge from-layer="216" from-port="2" to-layer="219" to-port="0" />
|
| <edge from-layer="217" from-port="0" to-layer="218" to-port="0" />
|
| <edge from-layer="218" from-port="1" to-layer="219" to-port="1" />
|
| <edge from-layer="219" from-port="2" to-layer="222" to-port="0" />
|
| <edge from-layer="220" from-port="0" to-layer="221" to-port="0" />
|
| <edge from-layer="221" from-port="1" to-layer="222" to-port="1" />
|
| <edge from-layer="222" from-port="2" to-layer="224" to-port="0" />
|
| <edge from-layer="223" from-port="0" to-layer="224" to-port="1" />
|
| <edge from-layer="224" from-port="2" to-layer="226" to-port="0" />
|
| <edge from-layer="225" from-port="0" to-layer="226" to-port="1" />
|
| <edge from-layer="226" from-port="2" to-layer="227" to-port="0" />
|
| <edge from-layer="226" from-port="2" to-layer="228" to-port="0" />
|
| <edge from-layer="226" from-port="2" to-layer="229" to-port="0" />
|
| <edge from-layer="227" from-port="3" to-layer="232" to-port="0" />
|
| <edge from-layer="228" from-port="3" to-layer="232" to-port="1" />
|
| <edge from-layer="229" from-port="3" to-layer="232" to-port="2" />
|
| <edge from-layer="230" from-port="0" to-layer="231" to-port="0" />
|
| <edge from-layer="231" from-port="1" to-layer="232" to-port="3" />
|
| <edge from-layer="232" from-port="5" to-layer="234" to-port="0" />
|
| <edge from-layer="233" from-port="0" to-layer="234" to-port="1" />
|
| <edge from-layer="234" from-port="2" to-layer="236" to-port="0" />
|
| <edge from-layer="235" from-port="0" to-layer="236" to-port="1" />
|
| <edge from-layer="236" from-port="2" to-layer="239" to-port="0" />
|
| <edge from-layer="237" from-port="0" to-layer="238" to-port="0" />
|
| <edge from-layer="238" from-port="1" to-layer="239" to-port="1" />
|
| <edge from-layer="239" from-port="2" to-layer="242" to-port="0" />
|
| <edge from-layer="240" from-port="0" to-layer="241" to-port="0" />
|
| <edge from-layer="241" from-port="1" to-layer="242" to-port="1" />
|
| <edge from-layer="242" from-port="2" to-layer="243" to-port="0" />
|
| <edge from-layer="243" from-port="2" to-layer="265" to-port="1" />
|
| <edge from-layer="243" from-port="2" to-layer="245" to-port="0" />
|
| <edge from-layer="244" from-port="0" to-layer="245" to-port="1" />
|
| <edge from-layer="245" from-port="2" to-layer="248" to-port="0" />
|
| <edge from-layer="246" from-port="0" to-layer="247" to-port="0" />
|
| <edge from-layer="247" from-port="1" to-layer="248" to-port="1" />
|
| <edge from-layer="248" from-port="2" to-layer="251" to-port="0" />
|
| <edge from-layer="249" from-port="0" to-layer="250" to-port="0" />
|
| <edge from-layer="250" from-port="1" to-layer="251" to-port="1" />
|
| <edge from-layer="251" from-port="2" to-layer="254" to-port="0" />
|
| <edge from-layer="252" from-port="0" to-layer="253" to-port="0" />
|
| <edge from-layer="253" from-port="1" to-layer="254" to-port="1" />
|
| <edge from-layer="254" from-port="2" to-layer="257" to-port="0" />
|
| <edge from-layer="255" from-port="0" to-layer="256" to-port="0" />
|
| <edge from-layer="256" from-port="1" to-layer="257" to-port="1" />
|
| <edge from-layer="257" from-port="2" to-layer="258" to-port="0" />
|
| <edge from-layer="258" from-port="1" to-layer="261" to-port="0" />
|
| <edge from-layer="259" from-port="0" to-layer="260" to-port="0" />
|
| <edge from-layer="260" from-port="1" to-layer="261" to-port="1" />
|
| <edge from-layer="261" from-port="2" to-layer="264" to-port="0" />
|
| <edge from-layer="262" from-port="0" to-layer="263" to-port="0" />
|
| <edge from-layer="263" from-port="1" to-layer="264" to-port="1" />
|
| <edge from-layer="264" from-port="2" to-layer="265" to-port="0" />
|
| <edge from-layer="265" from-port="2" to-layer="300" to-port="1" />
|
| <edge from-layer="265" from-port="2" to-layer="267" to-port="0" />
|
| <edge from-layer="266" from-port="0" to-layer="267" to-port="1" />
|
| <edge from-layer="267" from-port="2" to-layer="270" to-port="0" />
|
| <edge from-layer="268" from-port="0" to-layer="269" to-port="0" />
|
| <edge from-layer="269" from-port="1" to-layer="270" to-port="1" />
|
| <edge from-layer="270" from-port="2" to-layer="273" to-port="0" />
|
| <edge from-layer="271" from-port="0" to-layer="272" to-port="0" />
|
| <edge from-layer="272" from-port="1" to-layer="273" to-port="1" />
|
| <edge from-layer="273" from-port="2" to-layer="276" to-port="0" />
|
| <edge from-layer="274" from-port="0" to-layer="275" to-port="0" />
|
| <edge from-layer="275" from-port="1" to-layer="276" to-port="1" />
|
| <edge from-layer="276" from-port="2" to-layer="279" to-port="0" />
|
| <edge from-layer="277" from-port="0" to-layer="278" to-port="0" />
|
| <edge from-layer="278" from-port="1" to-layer="279" to-port="1" />
|
| <edge from-layer="279" from-port="2" to-layer="281" to-port="0" />
|
| <edge from-layer="280" from-port="0" to-layer="281" to-port="1" />
|
| <edge from-layer="281" from-port="2" to-layer="283" to-port="0" />
|
| <edge from-layer="282" from-port="0" to-layer="283" to-port="1" />
|
| <edge from-layer="283" from-port="2" to-layer="284" to-port="0" />
|
| <edge from-layer="283" from-port="2" to-layer="285" to-port="0" />
|
| <edge from-layer="283" from-port="2" to-layer="286" to-port="0" />
|
| <edge from-layer="284" from-port="3" to-layer="289" to-port="0" />
|
| <edge from-layer="285" from-port="3" to-layer="289" to-port="1" />
|
| <edge from-layer="286" from-port="3" to-layer="289" to-port="2" />
|
| <edge from-layer="287" from-port="0" to-layer="288" to-port="0" />
|
| <edge from-layer="288" from-port="1" to-layer="289" to-port="3" />
|
| <edge from-layer="289" from-port="5" to-layer="291" to-port="0" />
|
| <edge from-layer="290" from-port="0" to-layer="291" to-port="1" />
|
| <edge from-layer="291" from-port="2" to-layer="293" to-port="0" />
|
| <edge from-layer="292" from-port="0" to-layer="293" to-port="1" />
|
| <edge from-layer="293" from-port="2" to-layer="296" to-port="0" />
|
| <edge from-layer="294" from-port="0" to-layer="295" to-port="0" />
|
| <edge from-layer="295" from-port="1" to-layer="296" to-port="1" />
|
| <edge from-layer="296" from-port="2" to-layer="299" to-port="0" />
|
| <edge from-layer="297" from-port="0" to-layer="298" to-port="0" />
|
| <edge from-layer="298" from-port="1" to-layer="299" to-port="1" />
|
| <edge from-layer="299" from-port="2" to-layer="300" to-port="0" />
|
| <edge from-layer="300" from-port="2" to-layer="302" to-port="0" />
|
| <edge from-layer="300" from-port="2" to-layer="322" to-port="1" />
|
| <edge from-layer="301" from-port="0" to-layer="302" to-port="1" />
|
| <edge from-layer="302" from-port="2" to-layer="305" to-port="0" />
|
| <edge from-layer="303" from-port="0" to-layer="304" to-port="0" />
|
| <edge from-layer="304" from-port="1" to-layer="305" to-port="1" />
|
| <edge from-layer="305" from-port="2" to-layer="308" to-port="0" />
|
| <edge from-layer="306" from-port="0" to-layer="307" to-port="0" />
|
| <edge from-layer="307" from-port="1" to-layer="308" to-port="1" />
|
| <edge from-layer="308" from-port="2" to-layer="311" to-port="0" />
|
| <edge from-layer="309" from-port="0" to-layer="310" to-port="0" />
|
| <edge from-layer="310" from-port="1" to-layer="311" to-port="1" />
|
| <edge from-layer="311" from-port="2" to-layer="314" to-port="0" />
|
| <edge from-layer="312" from-port="0" to-layer="313" to-port="0" />
|
| <edge from-layer="313" from-port="1" to-layer="314" to-port="1" />
|
| <edge from-layer="314" from-port="2" to-layer="315" to-port="0" />
|
| <edge from-layer="315" from-port="1" to-layer="318" to-port="0" />
|
| <edge from-layer="316" from-port="0" to-layer="317" to-port="0" />
|
| <edge from-layer="317" from-port="1" to-layer="318" to-port="1" />
|
| <edge from-layer="318" from-port="2" to-layer="321" to-port="0" />
|
| <edge from-layer="319" from-port="0" to-layer="320" to-port="0" />
|
| <edge from-layer="320" from-port="1" to-layer="321" to-port="1" />
|
| <edge from-layer="321" from-port="2" to-layer="322" to-port="0" />
|
| <edge from-layer="322" from-port="2" to-layer="357" to-port="1" />
|
| <edge from-layer="322" from-port="2" to-layer="324" to-port="0" />
|
| <edge from-layer="323" from-port="0" to-layer="324" to-port="1" />
|
| <edge from-layer="324" from-port="2" to-layer="327" to-port="0" />
|
| <edge from-layer="325" from-port="0" to-layer="326" to-port="0" />
|
| <edge from-layer="326" from-port="1" to-layer="327" to-port="1" />
|
| <edge from-layer="327" from-port="2" to-layer="330" to-port="0" />
|
| <edge from-layer="328" from-port="0" to-layer="329" to-port="0" />
|
| <edge from-layer="329" from-port="1" to-layer="330" to-port="1" />
|
| <edge from-layer="330" from-port="2" to-layer="333" to-port="0" />
|
| <edge from-layer="331" from-port="0" to-layer="332" to-port="0" />
|
| <edge from-layer="332" from-port="1" to-layer="333" to-port="1" />
|
| <edge from-layer="333" from-port="2" to-layer="336" to-port="0" />
|
| <edge from-layer="334" from-port="0" to-layer="335" to-port="0" />
|
| <edge from-layer="335" from-port="1" to-layer="336" to-port="1" />
|
| <edge from-layer="336" from-port="2" to-layer="338" to-port="0" />
|
| <edge from-layer="337" from-port="0" to-layer="338" to-port="1" />
|
| <edge from-layer="338" from-port="2" to-layer="340" to-port="0" />
|
| <edge from-layer="339" from-port="0" to-layer="340" to-port="1" />
|
| <edge from-layer="340" from-port="2" to-layer="343" to-port="0" />
|
| <edge from-layer="340" from-port="2" to-layer="342" to-port="0" />
|
| <edge from-layer="340" from-port="2" to-layer="341" to-port="0" />
|
| <edge from-layer="341" from-port="3" to-layer="346" to-port="0" />
|
| <edge from-layer="342" from-port="3" to-layer="346" to-port="1" />
|
| <edge from-layer="343" from-port="3" to-layer="346" to-port="2" />
|
| <edge from-layer="344" from-port="0" to-layer="345" to-port="0" />
|
| <edge from-layer="345" from-port="1" to-layer="346" to-port="3" />
|
| <edge from-layer="346" from-port="5" to-layer="348" to-port="0" />
|
| <edge from-layer="347" from-port="0" to-layer="348" to-port="1" />
|
| <edge from-layer="348" from-port="2" to-layer="350" to-port="0" />
|
| <edge from-layer="349" from-port="0" to-layer="350" to-port="1" />
|
| <edge from-layer="350" from-port="2" to-layer="353" to-port="0" />
|
| <edge from-layer="351" from-port="0" to-layer="352" to-port="0" />
|
| <edge from-layer="352" from-port="1" to-layer="353" to-port="1" />
|
| <edge from-layer="353" from-port="2" to-layer="356" to-port="0" />
|
| <edge from-layer="354" from-port="0" to-layer="355" to-port="0" />
|
| <edge from-layer="355" from-port="1" to-layer="356" to-port="1" />
|
| <edge from-layer="356" from-port="2" to-layer="357" to-port="0" />
|
| <edge from-layer="357" from-port="2" to-layer="379" to-port="1" />
|
| <edge from-layer="357" from-port="2" to-layer="359" to-port="0" />
|
| <edge from-layer="358" from-port="0" to-layer="359" to-port="1" />
|
| <edge from-layer="359" from-port="2" to-layer="362" to-port="0" />
|
| <edge from-layer="360" from-port="0" to-layer="361" to-port="0" />
|
| <edge from-layer="361" from-port="1" to-layer="362" to-port="1" />
|
| <edge from-layer="362" from-port="2" to-layer="365" to-port="0" />
|
| <edge from-layer="363" from-port="0" to-layer="364" to-port="0" />
|
| <edge from-layer="364" from-port="1" to-layer="365" to-port="1" />
|
| <edge from-layer="365" from-port="2" to-layer="368" to-port="0" />
|
| <edge from-layer="366" from-port="0" to-layer="367" to-port="0" />
|
| <edge from-layer="367" from-port="1" to-layer="368" to-port="1" />
|
| <edge from-layer="368" from-port="2" to-layer="371" to-port="0" />
|
| <edge from-layer="369" from-port="0" to-layer="370" to-port="0" />
|
| <edge from-layer="370" from-port="1" to-layer="371" to-port="1" />
|
| <edge from-layer="371" from-port="2" to-layer="372" to-port="0" />
|
| <edge from-layer="372" from-port="1" to-layer="375" to-port="0" />
|
| <edge from-layer="373" from-port="0" to-layer="374" to-port="0" />
|
| <edge from-layer="374" from-port="1" to-layer="375" to-port="1" />
|
| <edge from-layer="375" from-port="2" to-layer="378" to-port="0" />
|
| <edge from-layer="376" from-port="0" to-layer="377" to-port="0" />
|
| <edge from-layer="377" from-port="1" to-layer="378" to-port="1" />
|
| <edge from-layer="378" from-port="2" to-layer="379" to-port="0" />
|
| <edge from-layer="379" from-port="2" to-layer="381" to-port="0" />
|
| <edge from-layer="379" from-port="2" to-layer="414" to-port="1" />
|
| <edge from-layer="380" from-port="0" to-layer="381" to-port="1" />
|
| <edge from-layer="381" from-port="2" to-layer="384" to-port="0" />
|
| <edge from-layer="382" from-port="0" to-layer="383" to-port="0" />
|
| <edge from-layer="383" from-port="1" to-layer="384" to-port="1" />
|
| <edge from-layer="384" from-port="2" to-layer="387" to-port="0" />
|
| <edge from-layer="385" from-port="0" to-layer="386" to-port="0" />
|
| <edge from-layer="386" from-port="1" to-layer="387" to-port="1" />
|
| <edge from-layer="387" from-port="2" to-layer="390" to-port="0" />
|
| <edge from-layer="388" from-port="0" to-layer="389" to-port="0" />
|
| <edge from-layer="389" from-port="1" to-layer="390" to-port="1" />
|
| <edge from-layer="390" from-port="2" to-layer="393" to-port="0" />
|
| <edge from-layer="391" from-port="0" to-layer="392" to-port="0" />
|
| <edge from-layer="392" from-port="1" to-layer="393" to-port="1" />
|
| <edge from-layer="393" from-port="2" to-layer="395" to-port="0" />
|
| <edge from-layer="394" from-port="0" to-layer="395" to-port="1" />
|
| <edge from-layer="395" from-port="2" to-layer="397" to-port="0" />
|
| <edge from-layer="396" from-port="0" to-layer="397" to-port="1" />
|
| <edge from-layer="397" from-port="2" to-layer="398" to-port="0" />
|
| <edge from-layer="397" from-port="2" to-layer="399" to-port="0" />
|
| <edge from-layer="397" from-port="2" to-layer="400" to-port="0" />
|
| <edge from-layer="398" from-port="3" to-layer="403" to-port="0" />
|
| <edge from-layer="399" from-port="3" to-layer="403" to-port="1" />
|
| <edge from-layer="400" from-port="3" to-layer="403" to-port="2" />
|
| <edge from-layer="401" from-port="0" to-layer="402" to-port="0" />
|
| <edge from-layer="402" from-port="1" to-layer="403" to-port="3" />
|
| <edge from-layer="403" from-port="5" to-layer="405" to-port="0" />
|
| <edge from-layer="404" from-port="0" to-layer="405" to-port="1" />
|
| <edge from-layer="405" from-port="2" to-layer="407" to-port="0" />
|
| <edge from-layer="406" from-port="0" to-layer="407" to-port="1" />
|
| <edge from-layer="407" from-port="2" to-layer="410" to-port="0" />
|
| <edge from-layer="408" from-port="0" to-layer="409" to-port="0" />
|
| <edge from-layer="409" from-port="1" to-layer="410" to-port="1" />
|
| <edge from-layer="410" from-port="2" to-layer="413" to-port="0" />
|
| <edge from-layer="411" from-port="0" to-layer="412" to-port="0" />
|
| <edge from-layer="412" from-port="1" to-layer="413" to-port="1" />
|
| <edge from-layer="413" from-port="2" to-layer="414" to-port="0" />
|
| <edge from-layer="414" from-port="2" to-layer="436" to-port="1" />
|
| <edge from-layer="414" from-port="2" to-layer="416" to-port="0" />
|
| <edge from-layer="415" from-port="0" to-layer="416" to-port="1" />
|
| <edge from-layer="416" from-port="2" to-layer="419" to-port="0" />
|
| <edge from-layer="417" from-port="0" to-layer="418" to-port="0" />
|
| <edge from-layer="418" from-port="1" to-layer="419" to-port="1" />
|
| <edge from-layer="419" from-port="2" to-layer="422" to-port="0" />
|
| <edge from-layer="420" from-port="0" to-layer="421" to-port="0" />
|
| <edge from-layer="421" from-port="1" to-layer="422" to-port="1" />
|
| <edge from-layer="422" from-port="2" to-layer="425" to-port="0" />
|
| <edge from-layer="423" from-port="0" to-layer="424" to-port="0" />
|
| <edge from-layer="424" from-port="1" to-layer="425" to-port="1" />
|
| <edge from-layer="425" from-port="2" to-layer="428" to-port="0" />
|
| <edge from-layer="426" from-port="0" to-layer="427" to-port="0" />
|
| <edge from-layer="427" from-port="1" to-layer="428" to-port="1" />
|
| <edge from-layer="428" from-port="2" to-layer="429" to-port="0" />
|
| <edge from-layer="429" from-port="1" to-layer="432" to-port="0" />
|
| <edge from-layer="430" from-port="0" to-layer="431" to-port="0" />
|
| <edge from-layer="431" from-port="1" to-layer="432" to-port="1" />
|
| <edge from-layer="432" from-port="2" to-layer="435" to-port="0" />
|
| <edge from-layer="433" from-port="0" to-layer="434" to-port="0" />
|
| <edge from-layer="434" from-port="1" to-layer="435" to-port="1" />
|
| <edge from-layer="435" from-port="2" to-layer="436" to-port="0" />
|
| <edge from-layer="436" from-port="2" to-layer="438" to-port="0" />
|
| <edge from-layer="436" from-port="2" to-layer="471" to-port="1" />
|
| <edge from-layer="437" from-port="0" to-layer="438" to-port="1" />
|
| <edge from-layer="438" from-port="2" to-layer="441" to-port="0" />
|
| <edge from-layer="439" from-port="0" to-layer="440" to-port="0" />
|
| <edge from-layer="440" from-port="1" to-layer="441" to-port="1" />
|
| <edge from-layer="441" from-port="2" to-layer="444" to-port="0" />
|
| <edge from-layer="442" from-port="0" to-layer="443" to-port="0" />
|
| <edge from-layer="443" from-port="1" to-layer="444" to-port="1" />
|
| <edge from-layer="444" from-port="2" to-layer="447" to-port="0" />
|
| <edge from-layer="445" from-port="0" to-layer="446" to-port="0" />
|
| <edge from-layer="446" from-port="1" to-layer="447" to-port="1" />
|
| <edge from-layer="447" from-port="2" to-layer="450" to-port="0" />
|
| <edge from-layer="448" from-port="0" to-layer="449" to-port="0" />
|
| <edge from-layer="449" from-port="1" to-layer="450" to-port="1" />
|
| <edge from-layer="450" from-port="2" to-layer="452" to-port="0" />
|
| <edge from-layer="451" from-port="0" to-layer="452" to-port="1" />
|
| <edge from-layer="452" from-port="2" to-layer="454" to-port="0" />
|
| <edge from-layer="453" from-port="0" to-layer="454" to-port="1" />
|
| <edge from-layer="454" from-port="2" to-layer="457" to-port="0" />
|
| <edge from-layer="454" from-port="2" to-layer="455" to-port="0" />
|
| <edge from-layer="454" from-port="2" to-layer="456" to-port="0" />
|
| <edge from-layer="455" from-port="3" to-layer="460" to-port="0" />
|
| <edge from-layer="456" from-port="3" to-layer="460" to-port="1" />
|
| <edge from-layer="457" from-port="3" to-layer="460" to-port="2" />
|
| <edge from-layer="458" from-port="0" to-layer="459" to-port="0" />
|
| <edge from-layer="459" from-port="1" to-layer="460" to-port="3" />
|
| <edge from-layer="460" from-port="5" to-layer="462" to-port="0" />
|
| <edge from-layer="461" from-port="0" to-layer="462" to-port="1" />
|
| <edge from-layer="462" from-port="2" to-layer="464" to-port="0" />
|
| <edge from-layer="463" from-port="0" to-layer="464" to-port="1" />
|
| <edge from-layer="464" from-port="2" to-layer="467" to-port="0" />
|
| <edge from-layer="465" from-port="0" to-layer="466" to-port="0" />
|
| <edge from-layer="466" from-port="1" to-layer="467" to-port="1" />
|
| <edge from-layer="467" from-port="2" to-layer="470" to-port="0" />
|
| <edge from-layer="468" from-port="0" to-layer="469" to-port="0" />
|
| <edge from-layer="469" from-port="1" to-layer="470" to-port="1" />
|
| <edge from-layer="470" from-port="2" to-layer="471" to-port="0" />
|
| <edge from-layer="471" from-port="2" to-layer="493" to-port="1" />
|
| <edge from-layer="471" from-port="2" to-layer="473" to-port="0" />
|
| <edge from-layer="472" from-port="0" to-layer="473" to-port="1" />
|
| <edge from-layer="473" from-port="2" to-layer="476" to-port="0" />
|
| <edge from-layer="474" from-port="0" to-layer="475" to-port="0" />
|
| <edge from-layer="475" from-port="1" to-layer="476" to-port="1" />
|
| <edge from-layer="476" from-port="2" to-layer="479" to-port="0" />
|
| <edge from-layer="477" from-port="0" to-layer="478" to-port="0" />
|
| <edge from-layer="478" from-port="1" to-layer="479" to-port="1" />
|
| <edge from-layer="479" from-port="2" to-layer="482" to-port="0" />
|
| <edge from-layer="480" from-port="0" to-layer="481" to-port="0" />
|
| <edge from-layer="481" from-port="1" to-layer="482" to-port="1" />
|
| <edge from-layer="482" from-port="2" to-layer="485" to-port="0" />
|
| <edge from-layer="483" from-port="0" to-layer="484" to-port="0" />
|
| <edge from-layer="484" from-port="1" to-layer="485" to-port="1" />
|
| <edge from-layer="485" from-port="2" to-layer="486" to-port="0" />
|
| <edge from-layer="486" from-port="1" to-layer="489" to-port="0" />
|
| <edge from-layer="487" from-port="0" to-layer="488" to-port="0" />
|
| <edge from-layer="488" from-port="1" to-layer="489" to-port="1" />
|
| <edge from-layer="489" from-port="2" to-layer="492" to-port="0" />
|
| <edge from-layer="490" from-port="0" to-layer="491" to-port="0" />
|
| <edge from-layer="491" from-port="1" to-layer="492" to-port="1" />
|
| <edge from-layer="492" from-port="2" to-layer="493" to-port="0" />
|
| <edge from-layer="493" from-port="2" to-layer="495" to-port="0" />
|
| <edge from-layer="493" from-port="2" to-layer="528" to-port="1" />
|
| <edge from-layer="494" from-port="0" to-layer="495" to-port="1" />
|
| <edge from-layer="495" from-port="2" to-layer="498" to-port="0" />
|
| <edge from-layer="496" from-port="0" to-layer="497" to-port="0" />
|
| <edge from-layer="497" from-port="1" to-layer="498" to-port="1" />
|
| <edge from-layer="498" from-port="2" to-layer="501" to-port="0" />
|
| <edge from-layer="499" from-port="0" to-layer="500" to-port="0" />
|
| <edge from-layer="500" from-port="1" to-layer="501" to-port="1" />
|
| <edge from-layer="501" from-port="2" to-layer="504" to-port="0" />
|
| <edge from-layer="502" from-port="0" to-layer="503" to-port="0" />
|
| <edge from-layer="503" from-port="1" to-layer="504" to-port="1" />
|
| <edge from-layer="504" from-port="2" to-layer="507" to-port="0" />
|
| <edge from-layer="505" from-port="0" to-layer="506" to-port="0" />
|
| <edge from-layer="506" from-port="1" to-layer="507" to-port="1" />
|
| <edge from-layer="507" from-port="2" to-layer="509" to-port="0" />
|
| <edge from-layer="508" from-port="0" to-layer="509" to-port="1" />
|
| <edge from-layer="509" from-port="2" to-layer="511" to-port="0" />
|
| <edge from-layer="510" from-port="0" to-layer="511" to-port="1" />
|
| <edge from-layer="511" from-port="2" to-layer="514" to-port="0" />
|
| <edge from-layer="511" from-port="2" to-layer="513" to-port="0" />
|
| <edge from-layer="511" from-port="2" to-layer="512" to-port="0" />
|
| <edge from-layer="512" from-port="3" to-layer="517" to-port="0" />
|
| <edge from-layer="513" from-port="3" to-layer="517" to-port="1" />
|
| <edge from-layer="514" from-port="3" to-layer="517" to-port="2" />
|
| <edge from-layer="515" from-port="0" to-layer="516" to-port="0" />
|
| <edge from-layer="516" from-port="1" to-layer="517" to-port="3" />
|
| <edge from-layer="517" from-port="5" to-layer="519" to-port="0" />
|
| <edge from-layer="518" from-port="0" to-layer="519" to-port="1" />
|
| <edge from-layer="519" from-port="2" to-layer="521" to-port="0" />
|
| <edge from-layer="520" from-port="0" to-layer="521" to-port="1" />
|
| <edge from-layer="521" from-port="2" to-layer="524" to-port="0" />
|
| <edge from-layer="522" from-port="0" to-layer="523" to-port="0" />
|
| <edge from-layer="523" from-port="1" to-layer="524" to-port="1" />
|
| <edge from-layer="524" from-port="2" to-layer="527" to-port="0" />
|
| <edge from-layer="525" from-port="0" to-layer="526" to-port="0" />
|
| <edge from-layer="526" from-port="1" to-layer="527" to-port="1" />
|
| <edge from-layer="527" from-port="2" to-layer="528" to-port="0" />
|
| <edge from-layer="528" from-port="2" to-layer="530" to-port="0" />
|
| <edge from-layer="528" from-port="2" to-layer="550" to-port="1" />
|
| <edge from-layer="529" from-port="0" to-layer="530" to-port="1" />
|
| <edge from-layer="530" from-port="2" to-layer="533" to-port="0" />
|
| <edge from-layer="531" from-port="0" to-layer="532" to-port="0" />
|
| <edge from-layer="532" from-port="1" to-layer="533" to-port="1" />
|
| <edge from-layer="533" from-port="2" to-layer="536" to-port="0" />
|
| <edge from-layer="534" from-port="0" to-layer="535" to-port="0" />
|
| <edge from-layer="535" from-port="1" to-layer="536" to-port="1" />
|
| <edge from-layer="536" from-port="2" to-layer="539" to-port="0" />
|
| <edge from-layer="537" from-port="0" to-layer="538" to-port="0" />
|
| <edge from-layer="538" from-port="1" to-layer="539" to-port="1" />
|
| <edge from-layer="539" from-port="2" to-layer="542" to-port="0" />
|
| <edge from-layer="540" from-port="0" to-layer="541" to-port="0" />
|
| <edge from-layer="541" from-port="1" to-layer="542" to-port="1" />
|
| <edge from-layer="542" from-port="2" to-layer="543" to-port="0" />
|
| <edge from-layer="543" from-port="1" to-layer="546" to-port="0" />
|
| <edge from-layer="544" from-port="0" to-layer="545" to-port="0" />
|
| <edge from-layer="545" from-port="1" to-layer="546" to-port="1" />
|
| <edge from-layer="546" from-port="2" to-layer="549" to-port="0" />
|
| <edge from-layer="547" from-port="0" to-layer="548" to-port="0" />
|
| <edge from-layer="548" from-port="1" to-layer="549" to-port="1" />
|
| <edge from-layer="549" from-port="2" to-layer="550" to-port="0" />
|
| <edge from-layer="550" from-port="2" to-layer="552" to-port="0" />
|
| <edge from-layer="550" from-port="2" to-layer="585" to-port="1" />
|
| <edge from-layer="551" from-port="0" to-layer="552" to-port="1" />
|
| <edge from-layer="552" from-port="2" to-layer="555" to-port="0" />
|
| <edge from-layer="553" from-port="0" to-layer="554" to-port="0" />
|
| <edge from-layer="554" from-port="1" to-layer="555" to-port="1" />
|
| <edge from-layer="555" from-port="2" to-layer="558" to-port="0" />
|
| <edge from-layer="556" from-port="0" to-layer="557" to-port="0" />
|
| <edge from-layer="557" from-port="1" to-layer="558" to-port="1" />
|
| <edge from-layer="558" from-port="2" to-layer="561" to-port="0" />
|
| <edge from-layer="559" from-port="0" to-layer="560" to-port="0" />
|
| <edge from-layer="560" from-port="1" to-layer="561" to-port="1" />
|
| <edge from-layer="561" from-port="2" to-layer="564" to-port="0" />
|
| <edge from-layer="562" from-port="0" to-layer="563" to-port="0" />
|
| <edge from-layer="563" from-port="1" to-layer="564" to-port="1" />
|
| <edge from-layer="564" from-port="2" to-layer="566" to-port="0" />
|
| <edge from-layer="565" from-port="0" to-layer="566" to-port="1" />
|
| <edge from-layer="566" from-port="2" to-layer="568" to-port="0" />
|
| <edge from-layer="567" from-port="0" to-layer="568" to-port="1" />
|
| <edge from-layer="568" from-port="2" to-layer="569" to-port="0" />
|
| <edge from-layer="568" from-port="2" to-layer="570" to-port="0" />
|
| <edge from-layer="568" from-port="2" to-layer="571" to-port="0" />
|
| <edge from-layer="569" from-port="3" to-layer="574" to-port="0" />
|
| <edge from-layer="570" from-port="3" to-layer="574" to-port="1" />
|
| <edge from-layer="571" from-port="3" to-layer="574" to-port="2" />
|
| <edge from-layer="572" from-port="0" to-layer="573" to-port="0" />
|
| <edge from-layer="573" from-port="1" to-layer="574" to-port="3" />
|
| <edge from-layer="574" from-port="5" to-layer="576" to-port="0" />
|
| <edge from-layer="575" from-port="0" to-layer="576" to-port="1" />
|
| <edge from-layer="576" from-port="2" to-layer="578" to-port="0" />
|
| <edge from-layer="577" from-port="0" to-layer="578" to-port="1" />
|
| <edge from-layer="578" from-port="2" to-layer="581" to-port="0" />
|
| <edge from-layer="579" from-port="0" to-layer="580" to-port="0" />
|
| <edge from-layer="580" from-port="1" to-layer="581" to-port="1" />
|
| <edge from-layer="581" from-port="2" to-layer="584" to-port="0" />
|
| <edge from-layer="582" from-port="0" to-layer="583" to-port="0" />
|
| <edge from-layer="583" from-port="1" to-layer="584" to-port="1" />
|
| <edge from-layer="584" from-port="2" to-layer="585" to-port="0" />
|
| <edge from-layer="585" from-port="2" to-layer="587" to-port="0" />
|
| <edge from-layer="585" from-port="2" to-layer="607" to-port="1" />
|
| <edge from-layer="586" from-port="0" to-layer="587" to-port="1" />
|
| <edge from-layer="587" from-port="2" to-layer="590" to-port="0" />
|
| <edge from-layer="588" from-port="0" to-layer="589" to-port="0" />
|
| <edge from-layer="589" from-port="1" to-layer="590" to-port="1" />
|
| <edge from-layer="590" from-port="2" to-layer="593" to-port="0" />
|
| <edge from-layer="591" from-port="0" to-layer="592" to-port="0" />
|
| <edge from-layer="592" from-port="1" to-layer="593" to-port="1" />
|
| <edge from-layer="593" from-port="2" to-layer="596" to-port="0" />
|
| <edge from-layer="594" from-port="0" to-layer="595" to-port="0" />
|
| <edge from-layer="595" from-port="1" to-layer="596" to-port="1" />
|
| <edge from-layer="596" from-port="2" to-layer="599" to-port="0" />
|
| <edge from-layer="597" from-port="0" to-layer="598" to-port="0" />
|
| <edge from-layer="598" from-port="1" to-layer="599" to-port="1" />
|
| <edge from-layer="599" from-port="2" to-layer="600" to-port="0" />
|
| <edge from-layer="600" from-port="1" to-layer="603" to-port="0" />
|
| <edge from-layer="601" from-port="0" to-layer="602" to-port="0" />
|
| <edge from-layer="602" from-port="1" to-layer="603" to-port="1" />
|
| <edge from-layer="603" from-port="2" to-layer="606" to-port="0" />
|
| <edge from-layer="604" from-port="0" to-layer="605" to-port="0" />
|
| <edge from-layer="605" from-port="1" to-layer="606" to-port="1" />
|
| <edge from-layer="606" from-port="2" to-layer="607" to-port="0" />
|
| <edge from-layer="607" from-port="2" to-layer="609" to-port="0" />
|
| <edge from-layer="607" from-port="2" to-layer="642" to-port="1" />
|
| <edge from-layer="608" from-port="0" to-layer="609" to-port="1" />
|
| <edge from-layer="609" from-port="2" to-layer="612" to-port="0" />
|
| <edge from-layer="610" from-port="0" to-layer="611" to-port="0" />
|
| <edge from-layer="611" from-port="1" to-layer="612" to-port="1" />
|
| <edge from-layer="612" from-port="2" to-layer="615" to-port="0" />
|
| <edge from-layer="613" from-port="0" to-layer="614" to-port="0" />
|
| <edge from-layer="614" from-port="1" to-layer="615" to-port="1" />
|
| <edge from-layer="615" from-port="2" to-layer="618" to-port="0" />
|
| <edge from-layer="616" from-port="0" to-layer="617" to-port="0" />
|
| <edge from-layer="617" from-port="1" to-layer="618" to-port="1" />
|
| <edge from-layer="618" from-port="2" to-layer="621" to-port="0" />
|
| <edge from-layer="619" from-port="0" to-layer="620" to-port="0" />
|
| <edge from-layer="620" from-port="1" to-layer="621" to-port="1" />
|
| <edge from-layer="621" from-port="2" to-layer="623" to-port="0" />
|
| <edge from-layer="622" from-port="0" to-layer="623" to-port="1" />
|
| <edge from-layer="623" from-port="2" to-layer="625" to-port="0" />
|
| <edge from-layer="624" from-port="0" to-layer="625" to-port="1" />
|
| <edge from-layer="625" from-port="2" to-layer="626" to-port="0" />
|
| <edge from-layer="625" from-port="2" to-layer="627" to-port="0" />
|
| <edge from-layer="625" from-port="2" to-layer="628" to-port="0" />
|
| <edge from-layer="626" from-port="3" to-layer="631" to-port="0" />
|
| <edge from-layer="627" from-port="3" to-layer="631" to-port="1" />
|
| <edge from-layer="628" from-port="3" to-layer="631" to-port="2" />
|
| <edge from-layer="629" from-port="0" to-layer="630" to-port="0" />
|
| <edge from-layer="630" from-port="1" to-layer="631" to-port="3" />
|
| <edge from-layer="631" from-port="5" to-layer="633" to-port="0" />
|
| <edge from-layer="632" from-port="0" to-layer="633" to-port="1" />
|
| <edge from-layer="633" from-port="2" to-layer="635" to-port="0" />
|
| <edge from-layer="634" from-port="0" to-layer="635" to-port="1" />
|
| <edge from-layer="635" from-port="2" to-layer="638" to-port="0" />
|
| <edge from-layer="636" from-port="0" to-layer="637" to-port="0" />
|
| <edge from-layer="637" from-port="1" to-layer="638" to-port="1" />
|
| <edge from-layer="638" from-port="2" to-layer="641" to-port="0" />
|
| <edge from-layer="639" from-port="0" to-layer="640" to-port="0" />
|
| <edge from-layer="640" from-port="1" to-layer="641" to-port="1" />
|
| <edge from-layer="641" from-port="2" to-layer="642" to-port="0" />
|
| <edge from-layer="642" from-port="2" to-layer="644" to-port="0" />
|
| <edge from-layer="642" from-port="2" to-layer="664" to-port="1" />
|
| <edge from-layer="643" from-port="0" to-layer="644" to-port="1" />
|
| <edge from-layer="644" from-port="2" to-layer="647" to-port="0" />
|
| <edge from-layer="645" from-port="0" to-layer="646" to-port="0" />
|
| <edge from-layer="646" from-port="1" to-layer="647" to-port="1" />
|
| <edge from-layer="647" from-port="2" to-layer="650" to-port="0" />
|
| <edge from-layer="648" from-port="0" to-layer="649" to-port="0" />
|
| <edge from-layer="649" from-port="1" to-layer="650" to-port="1" />
|
| <edge from-layer="650" from-port="2" to-layer="653" to-port="0" />
|
| <edge from-layer="651" from-port="0" to-layer="652" to-port="0" />
|
| <edge from-layer="652" from-port="1" to-layer="653" to-port="1" />
|
| <edge from-layer="653" from-port="2" to-layer="656" to-port="0" />
|
| <edge from-layer="654" from-port="0" to-layer="655" to-port="0" />
|
| <edge from-layer="655" from-port="1" to-layer="656" to-port="1" />
|
| <edge from-layer="656" from-port="2" to-layer="657" to-port="0" />
|
| <edge from-layer="657" from-port="1" to-layer="660" to-port="0" />
|
| <edge from-layer="658" from-port="0" to-layer="659" to-port="0" />
|
| <edge from-layer="659" from-port="1" to-layer="660" to-port="1" />
|
| <edge from-layer="660" from-port="2" to-layer="663" to-port="0" />
|
| <edge from-layer="661" from-port="0" to-layer="662" to-port="0" />
|
| <edge from-layer="662" from-port="1" to-layer="663" to-port="1" />
|
| <edge from-layer="663" from-port="2" to-layer="664" to-port="0" />
|
| <edge from-layer="664" from-port="2" to-layer="699" to-port="1" />
|
| <edge from-layer="664" from-port="2" to-layer="666" to-port="0" />
|
| <edge from-layer="665" from-port="0" to-layer="666" to-port="1" />
|
| <edge from-layer="666" from-port="2" to-layer="669" to-port="0" />
|
| <edge from-layer="667" from-port="0" to-layer="668" to-port="0" />
|
| <edge from-layer="668" from-port="1" to-layer="669" to-port="1" />
|
| <edge from-layer="669" from-port="2" to-layer="672" to-port="0" />
|
| <edge from-layer="670" from-port="0" to-layer="671" to-port="0" />
|
| <edge from-layer="671" from-port="1" to-layer="672" to-port="1" />
|
| <edge from-layer="672" from-port="2" to-layer="675" to-port="0" />
|
| <edge from-layer="673" from-port="0" to-layer="674" to-port="0" />
|
| <edge from-layer="674" from-port="1" to-layer="675" to-port="1" />
|
| <edge from-layer="675" from-port="2" to-layer="678" to-port="0" />
|
| <edge from-layer="676" from-port="0" to-layer="677" to-port="0" />
|
| <edge from-layer="677" from-port="1" to-layer="678" to-port="1" />
|
| <edge from-layer="678" from-port="2" to-layer="680" to-port="0" />
|
| <edge from-layer="679" from-port="0" to-layer="680" to-port="1" />
|
| <edge from-layer="680" from-port="2" to-layer="682" to-port="0" />
|
| <edge from-layer="681" from-port="0" to-layer="682" to-port="1" />
|
| <edge from-layer="682" from-port="2" to-layer="684" to-port="0" />
|
| <edge from-layer="682" from-port="2" to-layer="685" to-port="0" />
|
| <edge from-layer="682" from-port="2" to-layer="683" to-port="0" />
|
| <edge from-layer="683" from-port="3" to-layer="688" to-port="0" />
|
| <edge from-layer="684" from-port="3" to-layer="688" to-port="1" />
|
| <edge from-layer="685" from-port="3" to-layer="688" to-port="2" />
|
| <edge from-layer="686" from-port="0" to-layer="687" to-port="0" />
|
| <edge from-layer="687" from-port="1" to-layer="688" to-port="3" />
|
| <edge from-layer="688" from-port="5" to-layer="690" to-port="0" />
|
| <edge from-layer="689" from-port="0" to-layer="690" to-port="1" />
|
| <edge from-layer="690" from-port="2" to-layer="692" to-port="0" />
|
| <edge from-layer="691" from-port="0" to-layer="692" to-port="1" />
|
| <edge from-layer="692" from-port="2" to-layer="695" to-port="0" />
|
| <edge from-layer="693" from-port="0" to-layer="694" to-port="0" />
|
| <edge from-layer="694" from-port="1" to-layer="695" to-port="1" />
|
| <edge from-layer="695" from-port="2" to-layer="698" to-port="0" />
|
| <edge from-layer="696" from-port="0" to-layer="697" to-port="0" />
|
| <edge from-layer="697" from-port="1" to-layer="698" to-port="1" />
|
| <edge from-layer="698" from-port="2" to-layer="699" to-port="0" />
|
| <edge from-layer="699" from-port="2" to-layer="701" to-port="0" />
|
| <edge from-layer="699" from-port="2" to-layer="721" to-port="1" />
|
| <edge from-layer="700" from-port="0" to-layer="701" to-port="1" />
|
| <edge from-layer="701" from-port="2" to-layer="704" to-port="0" />
|
| <edge from-layer="702" from-port="0" to-layer="703" to-port="0" />
|
| <edge from-layer="703" from-port="1" to-layer="704" to-port="1" />
|
| <edge from-layer="704" from-port="2" to-layer="707" to-port="0" />
|
| <edge from-layer="705" from-port="0" to-layer="706" to-port="0" />
|
| <edge from-layer="706" from-port="1" to-layer="707" to-port="1" />
|
| <edge from-layer="707" from-port="2" to-layer="710" to-port="0" />
|
| <edge from-layer="708" from-port="0" to-layer="709" to-port="0" />
|
| <edge from-layer="709" from-port="1" to-layer="710" to-port="1" />
|
| <edge from-layer="710" from-port="2" to-layer="713" to-port="0" />
|
| <edge from-layer="711" from-port="0" to-layer="712" to-port="0" />
|
| <edge from-layer="712" from-port="1" to-layer="713" to-port="1" />
|
| <edge from-layer="713" from-port="2" to-layer="714" to-port="0" />
|
| <edge from-layer="714" from-port="1" to-layer="717" to-port="0" />
|
| <edge from-layer="715" from-port="0" to-layer="716" to-port="0" />
|
| <edge from-layer="716" from-port="1" to-layer="717" to-port="1" />
|
| <edge from-layer="717" from-port="2" to-layer="720" to-port="0" />
|
| <edge from-layer="718" from-port="0" to-layer="719" to-port="0" />
|
| <edge from-layer="719" from-port="1" to-layer="720" to-port="1" />
|
| <edge from-layer="720" from-port="2" to-layer="721" to-port="0" />
|
| <edge from-layer="721" from-port="2" to-layer="723" to-port="0" />
|
| <edge from-layer="722" from-port="0" to-layer="723" to-port="1" />
|
| <edge from-layer="723" from-port="2" to-layer="726" to-port="0" />
|
| <edge from-layer="724" from-port="0" to-layer="725" to-port="0" />
|
| <edge from-layer="725" from-port="1" to-layer="726" to-port="1" />
|
| <edge from-layer="726" from-port="2" to-layer="729" to-port="0" />
|
| <edge from-layer="727" from-port="0" to-layer="728" to-port="0" />
|
| <edge from-layer="728" from-port="1" to-layer="729" to-port="1" />
|
| <edge from-layer="729" from-port="2" to-layer="732" to-port="0" />
|
| <edge from-layer="729" from-port="2" to-layer="742" to-port="0" />
|
| <edge from-layer="730" from-port="0" to-layer="732" to-port="1" />
|
| <edge from-layer="731" from-port="0" to-layer="732" to-port="2" />
|
| <edge from-layer="732" from-port="3" to-layer="734" to-port="0" />
|
| <edge from-layer="733" from-port="0" to-layer="734" to-port="1" />
|
| <edge from-layer="734" from-port="2" to-layer="737" to-port="0" />
|
| <edge from-layer="735" from-port="0" to-layer="736" to-port="0" />
|
| <edge from-layer="736" from-port="1" to-layer="737" to-port="1" />
|
| <edge from-layer="737" from-port="2" to-layer="740" to-port="0" />
|
| <edge from-layer="738" from-port="0" to-layer="739" to-port="0" />
|
| <edge from-layer="739" from-port="1" to-layer="740" to-port="1" />
|
| <edge from-layer="740" from-port="2" to-layer="741" to-port="0" />
|
| </edges>
|
| <rt_info>
|
| <Runtime_version value="2025.3.0-19500-3ee669d7d10" />
|
| <conversion_parameters>
|
| <framework value="pytorch" />
|
| <is_python_object value="True" />
|
| </conversion_parameters>
|
| </rt_info>
|
| </net>
|
|
|