| <?xml version="1.0"?> |
| <net name="Model0" version="11"> |
| <layers> |
| <layer id="0" name="image_feature" type="Parameter" version="opset1"> |
| <data shape="?,?,?" element_type="f32" /> |
| <output> |
| <port id="0" precision="FP32" names="image_feature"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="1" name="pos_embed" type="Parameter" version="opset1"> |
| <data shape="?,?,?" element_type="f32" /> |
| <output> |
| <port id="0" precision="FP32" names="pos_embed"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="2" name="key_padding_mask" type="Parameter" version="opset1"> |
| <data shape="?,?" element_type="f32" /> |
| <output> |
| <port id="0" precision="FP32" names="key_padding_mask"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="3" name="Constant_9686" type="Const" version="opset1"> |
| <data element_type="i64" shape="4" offset="0" size="32" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>4</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="4" name="__module.attn/aten::view/Reshape_1" type="Reshape" version="opset1"> |
| <data special_zero="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>4</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="111"> |
| <dim>-1</dim> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>-1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="5" name="__module.attn/aten::expand/Abs" type="Const" version="opset1"> |
| <data element_type="i64" shape="4" offset="32" size="32" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>4</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="6" name="__module.attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> |
| <data mode="bidirectional" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>-1</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>4</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="113"> |
| <dim>-1</dim> |
| <dim>20</dim> |
| <dim>1</dim> |
| <dim>-1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="7" name="ShapeOf_9654" type="ShapeOf" version="opset3"> |
| <data output_type="i64" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="8" name="Constant_9655" type="Const" version="opset1"> |
| <data element_type="i64" shape="1" offset="64" size="8" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="9" name="Constant_9656" type="Const" version="opset1"> |
| <data element_type="i64" shape="" offset="64" size="8" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64" /> |
| </output> |
| </layer> |
| <layer id="10" name="Gather_9657" type="Gather" version="opset8"> |
| <data batch_dims="0" /> |
| <input> |
| <port id="0" precision="I64"> |
| <dim>3</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>1</dim> |
| </port> |
| <port id="2" precision="I64" /> |
| </input> |
| <output> |
| <port id="3" precision="I64" names="12,14,73"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="11" name="Constant_7566" type="Const" version="opset1"> |
| <data element_type="i64" shape="1" offset="72" size="8" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="12" name="__module.attn/aten::mul/Multiply" type="Multiply" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="I64"> |
| <dim>1</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="I64" names="104,105,114,115,92,93,98,99"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="13" name="Constant_326" type="Const" version="opset1"> |
| <data element_type="i64" shape="1" offset="80" size="8" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="14" name="Constant_9665" type="Const" version="opset1"> |
| <data element_type="i64" shape="1" offset="80" size="8" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="15" name="Constant_9666" type="Const" version="opset1"> |
| <data element_type="i64" shape="" offset="64" size="8" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64" /> |
| </output> |
| </layer> |
| <layer id="16" name="Gather_9667" type="Gather" version="opset8"> |
| <data batch_dims="0" /> |
| <input> |
| <port id="0" precision="I64"> |
| <dim>3</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>1</dim> |
| </port> |
| <port id="2" precision="I64" /> |
| </input> |
| <output> |
| <port id="3" precision="I64" names="103,109,97"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="17" name="__module.attn/prim::ListConstruct_2" type="Concat" version="opset1"> |
| <data axis="0" /> |
| <input> |
| <port id="0" precision="I64"> |
| <dim>1</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>1</dim> |
| </port> |
| <port id="2" precision="I64"> |
| <dim>1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="3" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="18" name="__module.attn/aten::reshape/Reshape" type="Reshape" version="opset1"> |
| <data special_zero="false" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>20</dim> |
| <dim>1</dim> |
| <dim>-1</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="117,key_padding_mask_1"> |
| <dim>-1</dim> |
| <dim>1</dim> |
| <dim>-1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="19" name="aten::unsqueeze/Unsqueeze_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="64, 1, 2560" offset="88" size="327680" /> |
| <output> |
| <port id="0" precision="FP16" names="24"> |
| <dim>64</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="20" name="aten::unsqueeze/Unsqueeze" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>64</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>64</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="21" name="Constant_891" type="Const" version="opset1"> |
| <data element_type="i64" shape="1" offset="80" size="8" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="22" name="Constant_898" type="Const" version="opset1"> |
| <data element_type="i64" shape="1" offset="80" size="8" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="23" name="prim::ListConstruct/Concat" type="Concat" version="opset1"> |
| <data axis="0" /> |
| <input> |
| <port id="0" precision="I64"> |
| <dim>1</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>1</dim> |
| </port> |
| <port id="2" precision="I64"> |
| <dim>1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="3" precision="I64" names="27"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="24" name="aten::repeat/Tile" type="Tile" version="opset1"> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>64</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="28,query.1"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="25" name="__module.attn/prim::ListUnpack/VariadicSplit.0_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="2560, 2560" offset="327768" size="13107200" /> |
| <output> |
| <port id="0" precision="FP16" names="82,w_q"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="26" name="__module.attn/prim::ListUnpack/VariadicSplit.0" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="27" name="__module.attn/aten::linear/MatMul_1" type="MatMul" version="opset1"> |
| <data transpose_a="false" transpose_b="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="28" name="Constant_9232_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="1, 1, 2560" offset="13434968" size="5120" /> |
| <output> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="29" name="Constant_9232" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="30" name="__module.attn/aten::linear/Add_1" type="Add" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="89,q.3"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="31" name="Constant_9687" type="Const" version="opset1"> |
| <data element_type="i64" shape="3" offset="13440088" size="24" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="32" name="__module.attn/aten::view/Reshape_2" type="Reshape" version="opset1"> |
| <data special_zero="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="95"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="33" name="__module.attn/aten::transpose/Constant_1" type="Const" version="opset1"> |
| <data element_type="i32" shape="3" offset="13440112" size="12" /> |
| <output> |
| <port id="0" precision="I32"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="34" name="__module.attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| <port id="1" precision="I32"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="96,q"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>128</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="35" name="Constant_9233_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="1, 1, 1" offset="13440124" size="2" /> |
| <output> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="36" name="Constant_9233" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="37" name="__module.attn/aten::div/Divide_1" type="Divide" version="opset1"> |
| <data auto_broadcast="numpy" m_pythondiv="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>128</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="118,q_scaled"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>128</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="38" name="self.kv_proj.weight_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="2560, 1152" offset="13440126" size="5898240" /> |
| <output> |
| <port id="0" precision="FP16" names="self.kv_proj.weight"> |
| <dim>2560</dim> |
| <dim>1152</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="39" name="self.kv_proj.weight" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>2560</dim> |
| <dim>1152</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>1152</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="40" name="__module.kv_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> |
| <data transpose_a="false" transpose_b="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>1152</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="41,input.1"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="41" name="__module.ln_kv/aten::layer_norm/Multiply" type="Const" version="opset1"> |
| <data element_type="i32" shape="1" offset="19338366" size="4" /> |
| <output> |
| <port id="0" precision="I32"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="42" name="__module.ln_kv/aten::layer_norm/MVN" type="MVN" version="opset6"> |
| <data eps="9.9999999747524271e-07" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="I32"> |
| <dim>1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="43" name="Constant_9229_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="1, 1, 2560" offset="19338370" size="5120" /> |
| <output> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="44" name="Constant_9229" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="45" name="__module.ln_kv/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="46" name="Constant_9230_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="1, 1, 2560" offset="19343490" size="5120" /> |
| <output> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="47" name="Constant_9230" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="48" name="__module.ln_kv/aten::layer_norm/Add" type="Add" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="48"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="49" name="Constant_53" type="Const" version="opset1"> |
| <data element_type="i64" shape="3" offset="19348610" size="24" /> |
| <output> |
| <port id="0" precision="I64" names="20"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="50" name="aten::permute/Transpose" type="Transpose" version="opset1"> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="21,image_feature_1"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="51" name="aten::add/Add" type="Add" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="30,key"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="52" name="__module.attn/prim::ListUnpack/VariadicSplit.1_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="2560, 2560" offset="19348634" size="13107200" /> |
| <output> |
| <port id="0" precision="FP16" names="83,w_k"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="53" name="__module.attn/prim::ListUnpack/VariadicSplit.1" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="54" name="__module.attn/aten::linear/MatMul" type="MatMul" version="opset1"> |
| <data transpose_a="false" transpose_b="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="55" name="Constant_9231_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="1, 1, 2560" offset="32455834" size="5120" /> |
| <output> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="56" name="Constant_9231" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="57" name="__module.attn/aten::linear/Add" type="Add" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="90,k.1"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="58" name="Constant_9688" type="Const" version="opset1"> |
| <data element_type="i64" shape="3" offset="32460954" size="24" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="59" name="__module.attn/aten::view/Reshape" type="Reshape" version="opset1"> |
| <data special_zero="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="101"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="60" name="__module.attn/aten::transpose/Constant" type="Const" version="opset1"> |
| <data element_type="i32" shape="3" offset="13440112" size="12" /> |
| <output> |
| <port id="0" precision="I32"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="61" name="__module.attn/aten::transpose/Transpose" type="Transpose" version="opset1"> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| <port id="1" precision="I32"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="102,k"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="62" name="__module.attn/aten::baddbmm/MatMul" type="MatMul" version="opset1"> |
| <data transpose_a="false" transpose_b="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>128</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>-1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="63" name="__module.attn/aten::baddbmm/Add" type="Add" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>1</dim> |
| <dim>-1</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>-1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="120,input.5"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>-1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="64" name="__module.attn/aten::softmax/Softmax" type="SoftMax" version="opset8"> |
| <data axis="-1" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>-1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32" names="121,attn_output_weights.1"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>-1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="65" name="__module.attn/prim::ListUnpack/VariadicSplit.2_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="2560, 2560" offset="32460978" size="13107200" /> |
| <output> |
| <port id="0" precision="FP16" names="84,w_v"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="66" name="__module.attn/prim::ListUnpack/VariadicSplit.2" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="67" name="__module.attn/aten::linear/MatMul_2" type="MatMul" version="opset1"> |
| <data transpose_a="false" transpose_b="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="68" name="Constant_9234_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="1, 1, 2560" offset="45568178" size="5120" /> |
| <output> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="69" name="Constant_9234" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="70" name="__module.attn/aten::linear/Add_2" type="Add" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="91,v.1"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="71" name="Constant_9689" type="Const" version="opset1"> |
| <data element_type="i64" shape="3" offset="32460954" size="24" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="72" name="__module.attn/aten::view/Reshape_3" type="Reshape" version="opset1"> |
| <data special_zero="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="107"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="73" name="__module.attn/aten::transpose/Constant_3" type="Const" version="opset1"> |
| <data element_type="i32" shape="3" offset="13440112" size="12" /> |
| <output> |
| <port id="0" precision="I32"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="74" name="__module.attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| <port id="1" precision="I32"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="108,v"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="75" name="__module.attn/aten::bmm/MatMul" type="MatMul" version="opset1"> |
| <data transpose_a="false" transpose_b="false" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>-1</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>-1</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="122,attn_output.1"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>128</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="76" name="__module.attn/aten::transpose/Constant_4" type="Const" version="opset1"> |
| <data element_type="i32" shape="3" offset="13440112" size="12" /> |
| <output> |
| <port id="0" precision="I32"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="77" name="__module.attn/aten::transpose/Transpose_4" type="Transpose" version="opset1"> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>128</dim> |
| </port> |
| <port id="1" precision="I32"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="123"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="78" name="Concat_4375" type="Const" version="opset1"> |
| <data element_type="i64" shape="2" offset="45573298" size="16" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>2</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="79" name="__module.attn/aten::view/Reshape_4" type="Reshape" version="opset1"> |
| <data special_zero="false" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>128</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>2</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="128"> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="80" name="self.attn.out_proj.weight_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="2560, 2560" offset="45573314" size="13107200" /> |
| <output> |
| <port id="0" precision="FP16" names="self.attn.out_proj.weight"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="81" name="self.attn.out_proj.weight" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="82" name="__module.attn.out_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> |
| <data transpose_a="false" transpose_b="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32"> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="83" name="Constant_9235_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="1, 2560" offset="58680514" size="5120" /> |
| <output> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="84" name="Constant_9235" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="85" name="__module.attn.out_proj/ov_ext::linear/Add" type="Add" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="131,attn_output"> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="86" name="Constant_9690" type="Const" version="opset1"> |
| <data element_type="i64" shape="3" offset="58685634" size="24" /> |
| <rt_info> |
| <attribute name="precise" version="0" /> |
| </rt_info> |
| <output> |
| <port id="0" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="87" name="__module.attn/aten::view/Reshape_5" type="Reshape" version="opset1"> |
| <data special_zero="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="134,out"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="88" name="Constant_486" type="Const" version="opset1"> |
| <data element_type="i64" shape="3" offset="19348610" size="24" /> |
| <output> |
| <port id="0" precision="I64" names="35"> |
| <dim>3</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="89" name="aten::permute/Transpose_1" type="Transpose" version="opset1"> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>64</dim> |
| <dim>-1</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="I64"> |
| <dim>3</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="36,input"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="90" name="__module.ln_post/aten::layer_norm/Multiply" type="Const" version="opset1"> |
| <data element_type="i32" shape="1" offset="19338366" size="4" /> |
| <output> |
| <port id="0" precision="I32"> |
| <dim>1</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="91" name="__module.ln_post/aten::layer_norm/MVN" type="MVN" version="opset6"> |
| <data eps="9.9999999747524271e-07" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="I32"> |
| <dim>1</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="92" name="Constant_9236_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="1, 1, 2560" offset="58685658" size="5120" /> |
| <output> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="93" name="Constant_9236" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="94" name="__module.ln_post/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="95" name="Constant_9237_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="1, 1, 2560" offset="58690778" size="5120" /> |
| <output> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="96" name="Constant_9237" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="97" name="__module.ln_post/aten::layer_norm/Add" type="Add" version="opset1"> |
| <data auto_broadcast="numpy" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>1</dim> |
| <dim>1</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="141,x"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="98" name="Transpose_8047_compressed" type="Const" version="opset1"> |
| <data element_type="f16" shape="2560, 2560" offset="58695898" size="13107200" /> |
| <output> |
| <port id="0" precision="FP16"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="99" name="Transpose_8047" type="Convert" version="opset1"> |
| <data destination_type="f32" /> |
| <rt_info> |
| <attribute name="decompression" version="0" /> |
| </rt_info> |
| <input> |
| <port id="0" precision="FP16"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="100" name="aten::matmul/MatMul" type="MatMul" version="opset1"> |
| <data transpose_a="false" transpose_b="true" /> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>2560</dim> |
| </port> |
| <port id="1" precision="FP32"> |
| <dim>2560</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| <output> |
| <port id="2" precision="FP32" names="last_hidden_state"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>2560</dim> |
| </port> |
| </output> |
| </layer> |
| <layer id="101" name="Result_545" type="Result" version="opset1" output_names="last_hidden_state"> |
| <input> |
| <port id="0" precision="FP32"> |
| <dim>-1</dim> |
| <dim>64</dim> |
| <dim>2560</dim> |
| </port> |
| </input> |
| </layer> |
| </layers> |
| <edges> |
| <edge from-layer="0" from-port="0" to-layer="40" to-port="0" /> |
| <edge from-layer="0" from-port="0" to-layer="7" to-port="0" /> |
| <edge from-layer="1" from-port="0" to-layer="51" to-port="1" /> |
| <edge from-layer="2" from-port="0" to-layer="4" to-port="0" /> |
| <edge from-layer="3" from-port="0" to-layer="4" to-port="1" /> |
| <edge from-layer="4" from-port="2" to-layer="6" to-port="0" /> |
| <edge from-layer="5" from-port="0" to-layer="6" to-port="1" /> |
| <edge from-layer="6" from-port="2" to-layer="18" to-port="0" /> |
| <edge from-layer="7" from-port="1" to-layer="16" to-port="0" /> |
| <edge from-layer="7" from-port="1" to-layer="10" to-port="0" /> |
| <edge from-layer="8" from-port="0" to-layer="10" to-port="1" /> |
| <edge from-layer="9" from-port="0" to-layer="10" to-port="2" /> |
| <edge from-layer="10" from-port="3" to-layer="12" to-port="0" /> |
| <edge from-layer="10" from-port="3" to-layer="23" to-port="1" /> |
| <edge from-layer="11" from-port="0" to-layer="12" to-port="1" /> |
| <edge from-layer="12" from-port="2" to-layer="17" to-port="0" /> |
| <edge from-layer="13" from-port="0" to-layer="17" to-port="1" /> |
| <edge from-layer="14" from-port="0" to-layer="16" to-port="1" /> |
| <edge from-layer="15" from-port="0" to-layer="16" to-port="2" /> |
| <edge from-layer="16" from-port="3" to-layer="17" to-port="2" /> |
| <edge from-layer="17" from-port="3" to-layer="18" to-port="1" /> |
| <edge from-layer="18" from-port="2" to-layer="63" to-port="0" /> |
| <edge from-layer="19" from-port="0" to-layer="20" to-port="0" /> |
| <edge from-layer="20" from-port="1" to-layer="24" to-port="0" /> |
| <edge from-layer="21" from-port="0" to-layer="23" to-port="0" /> |
| <edge from-layer="22" from-port="0" to-layer="23" to-port="2" /> |
| <edge from-layer="23" from-port="3" to-layer="24" to-port="1" /> |
| <edge from-layer="24" from-port="2" to-layer="27" to-port="0" /> |
| <edge from-layer="25" from-port="0" to-layer="26" to-port="0" /> |
| <edge from-layer="26" from-port="1" to-layer="27" to-port="1" /> |
| <edge from-layer="27" from-port="2" to-layer="30" to-port="0" /> |
| <edge from-layer="28" from-port="0" to-layer="29" to-port="0" /> |
| <edge from-layer="29" from-port="1" to-layer="30" to-port="1" /> |
| <edge from-layer="30" from-port="2" to-layer="32" to-port="0" /> |
| <edge from-layer="31" from-port="0" to-layer="32" to-port="1" /> |
| <edge from-layer="32" from-port="2" to-layer="34" to-port="0" /> |
| <edge from-layer="33" from-port="0" to-layer="34" to-port="1" /> |
| <edge from-layer="34" from-port="2" to-layer="37" to-port="0" /> |
| <edge from-layer="35" from-port="0" to-layer="36" to-port="0" /> |
| <edge from-layer="36" from-port="1" to-layer="37" to-port="1" /> |
| <edge from-layer="37" from-port="2" to-layer="62" to-port="0" /> |
| <edge from-layer="38" from-port="0" to-layer="39" to-port="0" /> |
| <edge from-layer="39" from-port="1" to-layer="40" to-port="1" /> |
| <edge from-layer="40" from-port="2" to-layer="42" to-port="0" /> |
| <edge from-layer="41" from-port="0" to-layer="42" to-port="1" /> |
| <edge from-layer="42" from-port="2" to-layer="45" to-port="0" /> |
| <edge from-layer="43" from-port="0" to-layer="44" to-port="0" /> |
| <edge from-layer="44" from-port="1" to-layer="45" to-port="1" /> |
| <edge from-layer="45" from-port="2" to-layer="48" to-port="0" /> |
| <edge from-layer="46" from-port="0" to-layer="47" to-port="0" /> |
| <edge from-layer="47" from-port="1" to-layer="48" to-port="1" /> |
| <edge from-layer="48" from-port="2" to-layer="50" to-port="0" /> |
| <edge from-layer="49" from-port="0" to-layer="50" to-port="1" /> |
| <edge from-layer="50" from-port="2" to-layer="51" to-port="0" /> |
| <edge from-layer="50" from-port="2" to-layer="67" to-port="0" /> |
| <edge from-layer="51" from-port="2" to-layer="54" to-port="0" /> |
| <edge from-layer="52" from-port="0" to-layer="53" to-port="0" /> |
| <edge from-layer="53" from-port="1" to-layer="54" to-port="1" /> |
| <edge from-layer="54" from-port="2" to-layer="57" to-port="0" /> |
| <edge from-layer="55" from-port="0" to-layer="56" to-port="0" /> |
| <edge from-layer="56" from-port="1" to-layer="57" to-port="1" /> |
| <edge from-layer="57" from-port="2" to-layer="59" to-port="0" /> |
| <edge from-layer="58" from-port="0" to-layer="59" to-port="1" /> |
| <edge from-layer="59" from-port="2" to-layer="61" to-port="0" /> |
| <edge from-layer="60" from-port="0" to-layer="61" to-port="1" /> |
| <edge from-layer="61" from-port="2" to-layer="62" to-port="1" /> |
| <edge from-layer="62" from-port="2" to-layer="63" to-port="1" /> |
| <edge from-layer="63" from-port="2" to-layer="64" to-port="0" /> |
| <edge from-layer="64" from-port="1" to-layer="75" to-port="0" /> |
| <edge from-layer="65" from-port="0" to-layer="66" to-port="0" /> |
| <edge from-layer="66" from-port="1" to-layer="67" to-port="1" /> |
| <edge from-layer="67" from-port="2" to-layer="70" to-port="0" /> |
| <edge from-layer="68" from-port="0" to-layer="69" to-port="0" /> |
| <edge from-layer="69" from-port="1" to-layer="70" to-port="1" /> |
| <edge from-layer="70" from-port="2" to-layer="72" to-port="0" /> |
| <edge from-layer="71" from-port="0" to-layer="72" to-port="1" /> |
| <edge from-layer="72" from-port="2" to-layer="74" to-port="0" /> |
| <edge from-layer="73" from-port="0" to-layer="74" to-port="1" /> |
| <edge from-layer="74" from-port="2" to-layer="75" to-port="1" /> |
| <edge from-layer="75" from-port="2" to-layer="77" to-port="0" /> |
| <edge from-layer="76" from-port="0" to-layer="77" to-port="1" /> |
| <edge from-layer="77" from-port="2" to-layer="79" to-port="0" /> |
| <edge from-layer="78" from-port="0" to-layer="79" to-port="1" /> |
| <edge from-layer="79" from-port="2" to-layer="82" to-port="0" /> |
| <edge from-layer="80" from-port="0" to-layer="81" to-port="0" /> |
| <edge from-layer="81" from-port="1" to-layer="82" to-port="1" /> |
| <edge from-layer="82" from-port="2" to-layer="85" to-port="0" /> |
| <edge from-layer="83" from-port="0" to-layer="84" to-port="0" /> |
| <edge from-layer="84" from-port="1" to-layer="85" to-port="1" /> |
| <edge from-layer="85" from-port="2" to-layer="87" to-port="0" /> |
| <edge from-layer="86" from-port="0" to-layer="87" to-port="1" /> |
| <edge from-layer="87" from-port="2" to-layer="89" to-port="0" /> |
| <edge from-layer="88" from-port="0" to-layer="89" to-port="1" /> |
| <edge from-layer="89" from-port="2" to-layer="91" to-port="0" /> |
| <edge from-layer="90" from-port="0" to-layer="91" to-port="1" /> |
| <edge from-layer="91" from-port="2" to-layer="94" to-port="0" /> |
| <edge from-layer="92" from-port="0" to-layer="93" to-port="0" /> |
| <edge from-layer="93" from-port="1" to-layer="94" to-port="1" /> |
| <edge from-layer="94" from-port="2" to-layer="97" to-port="0" /> |
| <edge from-layer="95" from-port="0" to-layer="96" to-port="0" /> |
| <edge from-layer="96" from-port="1" to-layer="97" to-port="1" /> |
| <edge from-layer="97" from-port="2" to-layer="100" to-port="0" /> |
| <edge from-layer="98" from-port="0" to-layer="99" to-port="0" /> |
| <edge from-layer="99" from-port="1" to-layer="100" to-port="1" /> |
| <edge from-layer="100" from-port="2" to-layer="101" to-port="0" /> |
| </edges> |
| <rt_info> |
| <Runtime_version value="2026.0.0-20965-c6d6a13a886-releases/2026/0" /> |
| <conversion_parameters> |
| <framework value="pytorch" /> |
| <is_python_object value="True" /> |
| </conversion_parameters> |
| <optimum> |
| <optimum_intel_version value="1.27.0" /> |
| <optimum_version value="2.1.0" /> |
| <pytorch_version value="2.11.0" /> |
| <transformers_version value="4.57.6" /> |
| </optimum> |
| </rt_info> |
| </net> |
|
|