<?xml version="1.0"?> <net name="Model124" version="11"> <layers> <layer id="3" name="input_ids" type="Parameter" version="opset1"> <data shape="?,?" element_type="i64" /> <output> <port id="0" precision="I64" names="input_ids"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="2" name="attention_mask" type="Parameter" version="opset1"> <data shape="?,?" element_type="i64" /> <output> <port id="0" precision="I64" names="attention_mask"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1" name="position_ids" type="Parameter" version="opset1"> <data shape="?,?" element_type="i64" /> <output> <port id="0" precision="I64" names="position_ids"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="0" name="beam_idx" type="Parameter" version="opset1"> <data shape="?" element_type="i32" /> <output> <port id="0" precision="I32" names="beam_idx"> <dim>-1</dim> </port> </output> </layer> <layer id="4" name="Constant_1190680" type="Const" version="opset1"> <data element_type="f32" shape="" offset="0" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="5" name="ShapeOf_1190666" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="6" name="Constant_1190668" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="7" name="Constant_1190670" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="8" name="Gather_1190671" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>2</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="9" name="Constant_1190673" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="10" name="Constant_1190675" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="11" name="Constant_1190677" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="20" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="12" name="Concat_1190678" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="13" name="Broadcast_1190681" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </output> </layer> <layer id="14" name="ReadValue_1190218" type="ReadValue" version="opset6"> <data variable_id="past_key_values.9.valuepresent.9.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.9.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="15" name="Constant_1189432" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="16" name="Gather_1189433" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="17" name="Constant_1175925" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="28" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="18" name="self.model.embed_tokens.weight" type="Const" version="opset1"> <data element_type="u8" shape="131072, 3072" offset="12316" size="402653184" /> <output> <port id="0" precision="U8"> <dim>131072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="19" name="Convert_1228322" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>131072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="20" name="self.model.embed_tokens.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="131072, 1" offset="402665500" size="131072" /> <output> <port id="0" precision="U8"> <dim>131072</dim> <dim>1</dim> </port> </output> </layer> <layer id="21" name="Convert_1228325" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>131072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>131072</dim> <dim>1</dim> </port> </output> </layer> <layer id="22" name="self.model.embed_tokens.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>131072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="23" name="self.model.embed_tokens.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="131072, 1" offset="402796572" size="262144" /> <output> <port id="0" precision="FP16"> <dim>131072</dim> <dim>1</dim> </port> </output> </layer> <layer id="24" name="self.model.embed_tokens.weight/fq_weights_0" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>131072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="25" name="__module.model.embed_tokens/ov_ext::embedding/Convert" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>131072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="26" name="__module.model.embed_tokens/ov_ext::embedding/Convert_1" type="Convert" version="opset1"> <data destination_type="i32" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I32"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="27" name="__module.model.embed_tokens/ov_ext::embedding/Constant" type="Const" version="opset1"> <data element_type="i32" shape="" offset="0" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="28" name="__module.model.embed_tokens/ov_ext::embedding/Gather" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>131072</dim> <dim>3072</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> <dim>-1</dim> </port> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="FP32" names="373,456,467,hidden_states.1,inputs_embeds"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="29" name="Constant_1175834" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="403058716" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="30" name="Constant_1175833" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="31" name="Constant_1175831" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="32" name="__module.model.layers.0.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="457"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="33" name="Constant_1081854" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="458"> <dim>1</dim> </port> </output> </layer> <layer id="34" name="__module.model.layers.0.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="459,variance.1"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="35" name="Constant_1175832" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="36" name="__module.model.layers.0.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="460"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="37" name="__module.model.layers.0.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="38" name="__module.model.layers.0.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="461"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="39" name="__module.model.layers.0.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="462,463,hidden_states.3,hidden_states.5"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="40" name="__module.model.layers.0.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="464,466,hidden_states.7"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="41" name="self.model.layers.0.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="403071024" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="42" name="Convert_1229542" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="43" name="self.model.layers.0.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="412508208" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="44" name="Convert_1229545" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="45" name="self.model.layers.0.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="46" name="self.model.layers.0.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="412511280" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="47" name="self.model.layers.0.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="48" name="__module.model.layers.0.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="49" name="__module.model.layers.0.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="475,query_states.1"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="50" name="Constant_1187717" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="51" name="__module.model.layers.0.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="481"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="52" name="__module.model.layers.0.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="53" name="__module.model.layers.0.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="482,q.1"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="54" name="__module.model.rotary_emb/aten::unsqueeze/Unsqueeze_1" type="Const" version="opset1"> <data element_type="f32" shape="1, 128, 1" offset="412517472" size="512" /> <output> <port id="0" precision="FP32" names="427,428"> <dim>1</dim> <dim>128</dim> <dim>1</dim> </port> </output> </layer> <layer id="55" name="ShapeOf_1178349" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="56" name="Constant_1178350" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="57" name="Constant_1178351" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="58" name="Gather_1178352" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>3</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="1008,1146,1162,1300,1316,1454,1470,1608,1624,1762,1778,1916,1932,2070,2086,2224,2240,2378,2394,2532,2548,2686,2702,2840,2856,2994,3010,3148,3164,3302,3318,3456,3472,3610,3626,3764,3780,3918,3934,399,4072,4088,4226,4242,429,4380,4396,4534,4550,4688,4704,4842,4858,4996,5012,5150,5166,530,5304,5320,5458,546,5474,5612,5628,5766,5782,5920,5936,6074,6090,6228,6244,6382,6398,6536,6552,684,700,838,854,992"> <dim>1</dim> </port> </output> </layer> <layer id="59" name="Constant_1166378" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="60" name="Constant_1166380" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="61" name="__module.model.rotary_emb/prim::ListConstruct" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="3" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="62" name="__module.model.rotary_emb/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>128</dim> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="431,436,inv_freq_expanded,inv_freq_expanded.1"> <dim>-1</dim> <dim>128</dim> <dim>1</dim> </port> </output> </layer> <layer id="63" name="286" type="Const" version="opset1"> <data element_type="i64" shape="" offset="412517984" size="8" /> <output> <port id="0" precision="I64" names="286" /> </output> </layer> <layer id="64" name="__module.model.rotary_emb/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="433,434"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="65" name="__module.model.rotary_emb/aten::to/Convert_2" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="FP32" names="435,437,position_ids_expanded,position_ids_expanded.1"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="66" name="__module.model.rotary_emb/aten::matmul/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>128</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> </input> <output> <port id="2" precision="FP32" names="438"> <dim>-1</dim> <dim>128</dim> <dim>-1</dim> </port> </output> </layer> <layer id="67" name="__module.model.rotary_emb/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="3" offset="412517992" size="12" /> <output> <port id="0" precision="I32"> <dim>3</dim> </port> </output> </layer> <layer id="68" name="__module.model.rotary_emb/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>128</dim> <dim>-1</dim> </port> <port id="1" precision="I32"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="439"> <dim>-1</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="69" name="__module.model.rotary_emb/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="441,emb"> <dim>-1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="70" name="__module.model.rotary_emb/aten::cos/Cos" type="Cos" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="442,444,446,449,cos.1,cos.3,cos.5"> <dim>-1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="71" name="__module.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1108,1262,1416,1570,1724,1878,2032,2186,2340,2494,2648,2802,2956,3110,3264,3418,3572,3726,3880,4034,4188,4342,4496,4650,4804,489,4958,5112,5266,5420,5574,5728,5882,6036,6190,6344,646,6498,800,954,cos,cos.11,cos.13,cos.15,cos.17,cos.19,cos.21,cos.23,cos.25,cos.27,cos.29,cos.31,cos.33,cos.35,cos.37,cos.39,cos.41,cos.43,cos.45,cos.47,cos.49,cos.51,cos.53,cos.55,cos.57,cos.59,cos.61,cos.63,cos.65,cos.67,cos.69,cos.7,cos.71,cos.73,cos.75,cos.77,cos.79,cos.81,cos.83,cos.9"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="72" name="__module.model.layers.0.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="491"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="73" name="Constant_1082251" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="74" name="Constant_1082253" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="75" name="Constant_1082255" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="76" name="__module.model.layers.0.self_attn/aten::slice/Reshape" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518020" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="77" name="__module.model.layers.0.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="501,x2.1"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="78" name="Constant_1175835" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="79" name="__module.model.layers.0.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="502"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="80" name="Constant_1082148" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="81" name="Constant_1082192" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="82" name="Constant_1082194" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="83" name="__module.model.layers.0.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="496"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="84" name="__module.model.layers.0.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="504"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="85" name="__module.model.rotary_emb/aten::sin/Sin" type="Sin" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="443,445,447,450,sin.1,sin.3,sin.5"> <dim>-1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="86" name="__module.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1109,1263,1417,1571,1725,1879,2033,2187,2341,2495,2649,2803,2957,3111,3265,3419,3573,3727,3881,4035,4189,4343,4497,4651,4805,490,4959,5113,5267,5421,5575,5729,5883,6037,6191,6345,647,6499,801,955,sin,sin.11,sin.13,sin.15,sin.17,sin.19,sin.21,sin.23,sin.25,sin.27,sin.29,sin.31,sin.33,sin.35,sin.37,sin.39,sin.41,sin.43,sin.45,sin.47,sin.49,sin.51,sin.53,sin.55,sin.57,sin.59,sin.61,sin.63,sin.65,sin.67,sin.69,sin.7,sin.71,sin.73,sin.75,sin.77,sin.79,sin.81,sin.83,sin.9"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="87" name="__module.model.layers.0.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="505"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="88" name="__module.model.layers.0.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="506"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="89" name="ReadValue_1190060" type="ReadValue" version="opset6"> <data variable_id="past_key_values.0.keypresent.0.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.0.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="90" name="Constant_1189375" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="91" name="Gather_1189376" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="92" name="self.model.layers.0.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="412518032" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="93" name="Convert_1230342" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="94" name="self.model.layers.0.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="415663760" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="95" name="Convert_1230345" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="96" name="self.model.layers.0.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="97" name="self.model.layers.0.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="415664784" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="98" name="self.model.layers.0.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="99" name="__module.model.layers.0.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="100" name="__module.model.layers.0.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="477,key_states.3"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="101" name="Constant_1187718" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="102" name="__module.model.layers.0.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="484"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="103" name="__module.model.layers.0.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="104" name="__module.model.layers.0.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="485,k.1"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="105" name="__module.model.layers.0.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="507"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="106" name="Constant_1082394" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="107" name="Constant_1082396" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="108" name="Constant_1082398" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="109" name="__module.model.layers.0.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="517,x2.3"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="110" name="Constant_1175836" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="111" name="__module.model.layers.0.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="518"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="112" name="Constant_1082291" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="113" name="Constant_1082335" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="114" name="Constant_1082337" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="115" name="__module.model.layers.0.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="512"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="116" name="__module.model.layers.0.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="520"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="117" name="__module.model.layers.0.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="521"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="118" name="__module.model.layers.0.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="522,key_states.5"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="119" name="__module.model.layers.0.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="535,536,hidden_states.9,present.0.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="120" name="288" type="Const" version="opset1"> <data element_type="i64" shape="" offset="415666864" size="8" /> <output> <port id="0" precision="I64" names="288" /> </output> </layer> <layer id="121" name="__module.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="537,538,539"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="122" name="__module.model.layers.0.self_attn/aten::size/ShapeOf_2" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="123" name="Constant_1169148" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="415666872" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="124" name="Constant_1169149" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="125" name="Gather_1169150" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>4</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="126" name="Constant_1166387" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518020" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="127" name="ShapeOf_1178391" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="128" name="Constant_1178392" type="Const" version="opset1"> <data element_type="i64" shape="" offset="415666864" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="129" name="Constant_1178393" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="130" name="Gather_1178394" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>4</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="377" /> </output> </layer> <layer id="131" name="Constant_1226953" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="132" name="Reshape_1178406" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="133" name="Constant_1178360" type="Const" version="opset1"> <data element_type="i64" shape="" offset="412517984" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="134" name="Constant_1178361" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="135" name="Gather_1178362" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>3</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="379,384" /> </output> </layer> <layer id="136" name="Constant_1226954" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="137" name="Reshape_1178408" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="138" name="Add_1178409" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64" names="1024,1149,1178,1303,1332,1457,1486,1611,1640,1765,1794,1919,1948,2073,2102,2227,2256,2381,2410,2535,2564,2689,2718,2843,2872,2997,3026,3151,3180,3305,3334,3459,3488,3613,3642,3767,3796,3921,3950,4075,4104,4229,4258,4383,4412,4537,4566,4691,4720,4845,4874,4999,5028,5153,5182,5307,533,5336,5461,5490,5615,562,5644,5769,5798,5923,5952,6077,6106,6231,6260,6385,6414,6539,6568,687,716,841,870,995"> <dim>1</dim> </port> </output> </layer> <layer id="139" name="Constant_1166390" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="20" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="140" name="__module.model.layers.0.self_attn/prim::ListConstruct_2" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>2</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>5</dim> </port> </output> </layer> <layer id="141" name="__module.model.layers.0.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="541,hidden_states.11"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="142" name="Constant_1187719" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="143" name="__module.model.layers.0.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="545,key_states.7"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="144" name="ReadValue_1190062" type="ReadValue" version="opset6"> <data variable_id="past_key_values.0.valuepresent.0.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.0.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="145" name="Constant_1189378" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="146" name="Gather_1189379" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="147" name="self.model.layers.0.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="415666920" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="148" name="Convert_1230352" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="149" name="self.model.layers.0.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="418812648" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="150" name="Convert_1230355" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="151" name="self.model.layers.0.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="152" name="self.model.layers.0.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="418813672" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="153" name="self.model.layers.0.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="154" name="__module.model.layers.0.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="155" name="__module.model.layers.0.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="479,value_states.1"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="156" name="Constant_1187720" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="157" name="__module.model.layers.0.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="487"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="158" name="__module.model.layers.0.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="159" name="__module.model.layers.0.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="488"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="160" name="__module.model.layers.0.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="551,552,hidden_states.13,present.0.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="161" name="__module.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="553,554,555"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="162" name="__module.model.layers.0.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="557,hidden_states.15"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="163" name="Constant_1187721" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="164" name="__module.model.layers.0.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="561"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="165" name="__module.model/aten::triu/Constant" type="Const" version="opset1"> <data element_type="i32" shape="" offset="0" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="166" name="Multiply_1170288" type="Const" version="opset1"> <data element_type="f32" shape="" offset="418815720" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="167" name="Constant_1170293" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="418815724" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="168" name="ShapeOf_1178367" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="169" name="Constant_1178368" type="Const" version="opset1"> <data element_type="i64" shape="" offset="412517984" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="170" name="Constant_1178369" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="171" name="Gather_1178370" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>2</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="385,403" /> </output> </layer> <layer id="172" name="Constant_1226955" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="173" name="Reshape_1178372" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="174" name="__module.model/prim::ListConstruct" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="175" name="Maximum_1170294" type="Maximum" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64"> <dim>2</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="176" name="__module.model/aten::mul/Multiply" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP32" names="388"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="177" name="ShapeOf_1178377" type="ShapeOf" version="opset3"> <data output_type="i32" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I32"> <dim>2</dim> </port> </output> </layer> <layer id="178" name="Constant_1178378" type="Const" version="opset1"> <data element_type="i64" shape="" offset="412517984" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="179" name="Constant_1178379" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="180" name="Gather_1178380" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I32"> <dim>2</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I32" /> </output> </layer> <layer id="181" name="__module.model/aten::triu/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="" offset="418815740" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="182" name="__module.model/aten::triu/Range" type="Range" version="opset4"> <data output_type="i32" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32" /> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="I32"> <dim>-1</dim> </port> </output> </layer> <layer id="183" name="__module.model/aten::triu/Unsqueeze" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I32"> <dim>-1</dim> </port> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I32"> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="184" name="__module.model/aten::triu/Convert" type="Const" version="opset1"> <data element_type="i32" shape="" offset="418815740" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="185" name="Constant_1178384" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="186" name="Constant_1178385" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="187" name="Gather_1178386" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I32"> <dim>2</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I32" /> </output> </layer> <layer id="188" name="__module.model/aten::triu/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I32" /> </output> </layer> <layer id="189" name="__module.model/aten::triu/Range_1" type="Range" version="opset4"> <data output_type="i32" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32" /> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="I32"> <dim>-1</dim> </port> </output> </layer> <layer id="190" name="__module.model/aten::triu/Unsqueeze_1" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I32"> <dim>-1</dim> </port> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I32"> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="191" name="__module.model/aten::triu/GreaterEqual" type="GreaterEqual" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I32"> <dim>1</dim> <dim>-1</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="BOOL"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="192" name="__module.model/aten::triu/ConvertLike" type="Const" version="opset1"> <data element_type="f32" shape="" offset="0" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="193" name="__module.model/aten::triu/Select" type="Select" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="BOOL"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> <port id="2" precision="FP32" /> </input> <output> <port id="3" precision="FP32" names="389_1"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="194" name="__module.model/aten::arange/Constant" type="Const" version="opset1"> <data element_type="i32" shape="" offset="0" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="195" name="__module.model/aten::arange/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="" offset="418815740" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="196" name="__module.model/aten::arange/Range" type="Range" version="opset4"> <data output_type="f32" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I64" /> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> </port> </output> </layer> <layer id="197" name="__module.model/aten::arange/ConvertLike" type="Convert" version="opset1"> <data destination_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64" names="390"> <dim>-1</dim> </port> </output> </layer> <layer id="198" name="__module.model/aten::gt/Convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="I64"> <dim>-1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> </port> </output> </layer> <layer id="199" name="__module.model/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="381" /> </output> </layer> <layer id="200" name="__module.model/aten::arange/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="" offset="418815740" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="201" name="__module.model/aten::arange/Range_1" type="Range" version="opset4"> <data output_type="f32" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64" /> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="FP32" names="383,cache_position"> <dim>-1</dim> </port> </output> </layer> <layer id="202" name="Constant_1081462" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="418815744" size="16" /> <output> <port id="0" precision="I64" names="391"> <dim>2</dim> </port> </output> </layer> <layer id="203" name="__module.model/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP32" names="392"> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="204" name="__module.model/aten::gt/Greater" type="Greater" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="BOOL" names="393"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="205" name="__module.model/aten::mul_/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="BOOL"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="206" name="__module.model/aten::mul_/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="2" precision="FP32" names="389,causal_mask.1"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="207" name="279" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" names="279" /> </output> </layer> <layer id="208" name="__module.model/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="395"> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="209" name="__module.model/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="396,397,398"> <dim>1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="210" name="Constant_1166418" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="211" name="Constant_1166420" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="212" name="Constant_1166422" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="213" name="__module.model/prim::ListConstruct_1" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="214" name="__module.model/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="401,404,405,406,414,415,416,419_1,420_1,421_1,causal_mask.5"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="215" name="Constant_1226956" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="216" name="SliceAssign_1081679/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> </port> </output> </layer> <layer id="217" name="Constant_1131614" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="218" name="SliceAssign_1081679/ShapeOf" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="219" name="SliceAssign_1081679/ReduceProd" type="ReduceProd" version="opset1"> <data keep_dims="false" /> <input> <port id="0" precision="I64"> <dim>4</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" /> </output> </layer> <layer id="220" name="Constant_1131615" type="Const" version="opset1"> <data element_type="i64" shape="" offset="412517984" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="221" name="SliceAssign_1081679/Range" type="Range" version="opset4"> <data output_type="i64" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64"> <dim>-1</dim> </port> </output> </layer> <layer id="222" name="SliceAssign_1081679/Reshape" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="I64"> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="223" name="Constant_1081668" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="224" name="Constant_1081671" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="225" name="SliceAssign_1081679/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="226" name="Constant_1131617" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="418815744" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="227" name="SliceAssign_1081679/Reshape_4" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="228" name="Constant_1081551" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="229" name="Constant_1081554" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="230" name="__module.model/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="407,417,422_1"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="231" name="__module.model/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="409"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="232" name="__module.model/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="410,411"> <dim>-1</dim> <dim>1</dim> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="233" name="__module.model/aten::add/Convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="234" name="__module.model/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>1</dim> <dim>-1</dim> </port> </input> <output> <port id="2" precision="FP32" names="412,padding_mask.1"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="235" name="Constant_1175837" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="0" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="236" name="__module.model/aten::eq/Equal" type="Equal" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="BOOL" names="413,padding_mask"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="237" name="276" type="Const" version="opset1"> <data element_type="f32" shape="" offset="418815720" size="4" /> <output> <port id="0" precision="FP32" names="276" /> </output> </layer> <layer id="238" name="__module.model/aten::masked_fill/Select" type="Select" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="BOOL"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32" /> <port id="2" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="3" precision="FP32" names="418"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="239" name="__module.model/aten::copy_/ShapeOf" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="240" name="__module.model/aten::copy_/Broadcast" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="422"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="241" name="Constant_1226957" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="242" name="SliceAssign_1081679/Reshape_5" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> </port> </output> </layer> <layer id="243" name="SliceAssign_1081679/ScatterNDUpdate" type="ScatterNDUpdate" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>-1</dim> <dim>1</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> </port> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> </port> </output> </layer> <layer id="244" name="SliceAssign_1081679/Reshape_6" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1025,1026,1027,1179,1180,1181,1333,1334,1335,1487,1488,1489,1641,1642,1643,1795,1796,1797,1949,1950,1951,2103,2104,2105,2257,2258,2259,2411,2412,2413,2565,2566,2567,2719,2720,2721,2873,2874,2875,3027,3028,3029,3181,3182,3183,3335,3336,3337,3489,3490,3491,3643,3644,3645,3797,3798,3799,3951,3952,3953,402,4105,4106,4107,4259,4260,4261,4413,4414,4415,4567,4568,4569,4721,4722,4723,4875,4876,4877,5029,5030,5031,5183,5184,5185,5337,5338,5339,5491,5492,5493,563,564,5645,5646,5647,565,5799,5800,5801,5953,5954,5955,6107,6108,6109,6261,6262,6263,6415,6416,6417,6569,6570,6571,717,718,719,871,872,873"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="245" name="Constant_1082898" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="246" name="Constant_1082901" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="247" name="__module.model.layers.0.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1028,1182,1336,1490,1644,1798,1952,2106,2260,2414,2568,2722,2876,3030,3184,3338,3492,3646,3800,3954,4108,4262,4416,4570,4724,4878,5032,5186,5340,5494,5648,566,5802,5956,6110,6264,6418,6572,720,874"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="248" name="__module.model.layers.0.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="567,attn_output.1"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="249" name="__module.model.layers.0.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="250" name="__module.model.layers.0.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="568"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="251" name="Constant_1169143" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="415666872" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="252" name="Constant_1169144" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="253" name="Gather_1169145" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>3</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="254" name="Constant_1082975" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="255" name="__module.model.layers.0.self_attn/prim::ListConstruct_7" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>2</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="256" name="__module.model.layers.0.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="571"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="257" name="self.model.layers.0.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="418815760" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="258" name="Convert_1229552" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="259" name="self.model.layers.0.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="428252944" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="260" name="Convert_1229555" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="261" name="self.model.layers.0.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="262" name="self.model.layers.0.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="428256016" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="263" name="self.model.layers.0.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="264" name="__module.model.layers.0.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="265" name="__module.model.layers.0.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="573,575,hidden_states.17"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="266" name="__module.model.layers.0/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="578,580,591,hidden_states.19,hidden_states.21"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="267" name="Constant_1175841" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="428262160" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="268" name="Constant_1175840" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="269" name="Constant_1175838" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="270" name="__module.model.layers.0.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="581"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="271" name="Constant_1083003" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="582"> <dim>1</dim> </port> </output> </layer> <layer id="272" name="__module.model.layers.0.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="583,variance.3"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="273" name="Constant_1175839" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="274" name="__module.model.layers.0.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="584"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="275" name="__module.model.layers.0.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="276" name="__module.model.layers.0.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="585"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="277" name="__module.model.layers.0.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="586,587,hidden_states.23,hidden_states.25"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="278" name="__module.model.layers.0.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="588,590"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="279" name="self.model.layers.0.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="428274448" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="280" name="Convert_1228352" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="281" name="self.model.layers.0.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="499053328" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="282" name="Convert_1228355" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="283" name="self.model.layers.0.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="284" name="self.model.layers.0.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="499076368" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="285" name="self.model.layers.0.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="286" name="__module.model.layers.0.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="287" name="__module.model.layers.0.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="596,input.1"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="288" name="__module.model.layers.0.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="597"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="289" name="self.model.layers.0.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="499122448" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="290" name="Convert_1228342" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="291" name="self.model.layers.0.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="569901328" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="292" name="Convert_1228345" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="293" name="self.model.layers.0.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="294" name="self.model.layers.0.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="569924368" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="295" name="self.model.layers.0.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="296" name="__module.model.layers.0.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="297" name="__module.model.layers.0.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="599"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="298" name="__module.model.layers.0.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="600"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="299" name="self.model.layers.0.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="569970448" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="300" name="Convert_1228362" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="301" name="self.model.layers.0.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="640749328" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="302" name="Convert_1228365" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="303" name="self.model.layers.0.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="304" name="self.model.layers.0.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="640752400" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="305" name="self.model.layers.0.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="306" name="__module.model.layers.0.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="307" name="__module.model.layers.0.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="602,hidden_states.27"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="308" name="__module.model.layers.0/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="603,605,613,624,hidden_states.29,hidden_states.31"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="309" name="Constant_1175845" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="640758544" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="310" name="Constant_1175844" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="311" name="Constant_1175842" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="312" name="__module.model.layers.1.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="614"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="313" name="Constant_1083077" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="615"> <dim>1</dim> </port> </output> </layer> <layer id="314" name="__module.model.layers.1.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="616,variance.5"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="315" name="Constant_1175843" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="316" name="__module.model.layers.1.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="617"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="317" name="__module.model.layers.1.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="318" name="__module.model.layers.1.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="618"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="319" name="__module.model.layers.1.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="619,620,hidden_states.33,hidden_states.35"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="320" name="__module.model.layers.1.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="621,623,hidden_states.37"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="321" name="self.model.layers.1.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="640770832" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="322" name="Convert_1229562" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="323" name="self.model.layers.1.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="650208016" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="324" name="Convert_1229565" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="325" name="self.model.layers.1.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="326" name="self.model.layers.1.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="650211088" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="327" name="self.model.layers.1.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="328" name="__module.model.layers.1.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="329" name="__module.model.layers.1.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="632,query_states.3"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="330" name="Constant_1187722" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="331" name="__module.model.layers.1.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="638"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="332" name="__module.model.layers.1.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="333" name="__module.model.layers.1.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="639,q.3"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="334" name="__module.model.layers.1.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="648"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="335" name="Constant_1083474" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="336" name="Constant_1083476" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="337" name="Constant_1083478" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="338" name="__module.model.layers.1.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="658,x2.5"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="339" name="Constant_1175846" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="340" name="__module.model.layers.1.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="659"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="341" name="Constant_1083371" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="342" name="Constant_1083415" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="343" name="Constant_1083417" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="344" name="__module.model.layers.1.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="653"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="345" name="__module.model.layers.1.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="661"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="346" name="__module.model.layers.1.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="662"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="347" name="__module.model.layers.1.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="663"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="348" name="ReadValue_1190064" type="ReadValue" version="opset6"> <data variable_id="past_key_values.1.keypresent.1.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.1.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="349" name="Constant_1189381" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="350" name="Gather_1189382" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="351" name="self.model.layers.1.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="650217232" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="352" name="Convert_1230372" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="353" name="self.model.layers.1.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="653362960" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="354" name="Convert_1230375" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="355" name="self.model.layers.1.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="356" name="self.model.layers.1.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="653363984" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="357" name="self.model.layers.1.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="358" name="__module.model.layers.1.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="359" name="__module.model.layers.1.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="634,key_states.9"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="360" name="Constant_1187723" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="361" name="__module.model.layers.1.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="641"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="362" name="__module.model.layers.1.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="363" name="__module.model.layers.1.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="642,k.3"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="364" name="__module.model.layers.1.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="664"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="365" name="Constant_1083617" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="366" name="Constant_1083619" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="367" name="Constant_1083621" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="368" name="__module.model.layers.1.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="674,x2.7"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="369" name="Constant_1175847" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="370" name="__module.model.layers.1.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="675"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="371" name="Constant_1083514" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="372" name="Constant_1083558" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="373" name="Constant_1083560" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="374" name="__module.model.layers.1.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="669"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="375" name="__module.model.layers.1.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="677"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="376" name="__module.model.layers.1.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="678"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="377" name="__module.model.layers.1.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="679"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="378" name="__module.model.layers.1.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="689,690,hidden_states.39,present.1.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="379" name="__module.model.layers.1.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="691,692,693"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="380" name="__module.model.layers.1.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="695,hidden_states.41"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="381" name="Constant_1187724" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="382" name="__module.model.layers.1.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="699,key_states.11"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="383" name="ReadValue_1190066" type="ReadValue" version="opset6"> <data variable_id="past_key_values.1.valuepresent.1.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.1.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="384" name="Constant_1189384" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="385" name="Gather_1189385" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="386" name="self.model.layers.1.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="653366032" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="387" name="Convert_1230362" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="388" name="self.model.layers.1.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="656511760" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="389" name="Convert_1230365" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="390" name="self.model.layers.1.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="391" name="self.model.layers.1.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="656512784" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="392" name="self.model.layers.1.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="393" name="__module.model.layers.1.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="394" name="__module.model.layers.1.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="636,value_states.3"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="395" name="Constant_1187725" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="396" name="__module.model.layers.1.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="644"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="397" name="__module.model.layers.1.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="398" name="__module.model.layers.1.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="645"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="399" name="__module.model.layers.1.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="705,706,hidden_states.43,present.1.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="400" name="__module.model.layers.1.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="707,708,709"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="401" name="__module.model.layers.1.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="711,hidden_states.45"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="402" name="Constant_1187726" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="403" name="__module.model.layers.1.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="715"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="404" name="__module.model.layers.1.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="721,attn_output.5"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="405" name="__module.model.layers.1.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="406" name="__module.model.layers.1.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="722"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="407" name="__module.model.layers.1.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="725"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="408" name="self.model.layers.1.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="656514832" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="409" name="Convert_1229572" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="410" name="self.model.layers.1.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="665952016" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="411" name="Convert_1229575" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="412" name="self.model.layers.1.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="413" name="self.model.layers.1.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="665955088" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="414" name="self.model.layers.1.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="415" name="__module.model.layers.1.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="416" name="__module.model.layers.1.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="727,729,hidden_states.47"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="417" name="__module.model.layers.1/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="732,734,745,hidden_states.49,hidden_states.51"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="418" name="Constant_1175851" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="665961232" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="419" name="Constant_1175850" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="420" name="Constant_1175848" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="421" name="__module.model.layers.1.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="735"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="422" name="Constant_1084220" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="736"> <dim>1</dim> </port> </output> </layer> <layer id="423" name="__module.model.layers.1.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="737,variance.7"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="424" name="Constant_1175849" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="425" name="__module.model.layers.1.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="738"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="426" name="__module.model.layers.1.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="427" name="__module.model.layers.1.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="739"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="428" name="__module.model.layers.1.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="740,741,hidden_states.53,hidden_states.55"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="429" name="__module.model.layers.1.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="742,744"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="430" name="self.model.layers.1.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="665973520" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="431" name="Convert_1228382" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="432" name="self.model.layers.1.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="736752400" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="433" name="Convert_1228385" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="434" name="self.model.layers.1.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="435" name="self.model.layers.1.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="736775440" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="436" name="self.model.layers.1.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="437" name="__module.model.layers.1.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="438" name="__module.model.layers.1.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="750,input.3"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="439" name="__module.model.layers.1.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="751"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="440" name="self.model.layers.1.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="736821520" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="441" name="Convert_1228372" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="442" name="self.model.layers.1.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="807600400" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="443" name="Convert_1228375" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="444" name="self.model.layers.1.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="445" name="self.model.layers.1.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="807623440" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="446" name="self.model.layers.1.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="447" name="__module.model.layers.1.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="448" name="__module.model.layers.1.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="753"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="449" name="__module.model.layers.1.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="754"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="450" name="self.model.layers.1.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="807669520" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="451" name="Convert_1228392" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="452" name="self.model.layers.1.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="878448400" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="453" name="Convert_1228395" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="454" name="self.model.layers.1.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="455" name="self.model.layers.1.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="878451472" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="456" name="self.model.layers.1.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="457" name="__module.model.layers.1.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="458" name="__module.model.layers.1.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="756,hidden_states.57"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="459" name="__module.model.layers.1/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="757,759,767,778,hidden_states.59,hidden_states.61"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="460" name="Constant_1175855" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="878457616" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="461" name="Constant_1175854" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="462" name="Constant_1175852" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="463" name="__module.model.layers.2.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="768"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="464" name="Constant_1084294" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="769"> <dim>1</dim> </port> </output> </layer> <layer id="465" name="__module.model.layers.2.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="770,variance.9"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="466" name="Constant_1175853" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="467" name="__module.model.layers.2.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="771"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="468" name="__module.model.layers.2.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="469" name="__module.model.layers.2.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="772"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="470" name="__module.model.layers.2.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="773,774,hidden_states.63,hidden_states.65"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="471" name="__module.model.layers.2.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="775,777,hidden_states.67"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="472" name="self.model.layers.2.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="878469904" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="473" name="Convert_1229582" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="474" name="self.model.layers.2.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="887907088" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="475" name="Convert_1229585" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="476" name="self.model.layers.2.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="477" name="self.model.layers.2.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="887910160" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="478" name="self.model.layers.2.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="479" name="__module.model.layers.2.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="480" name="__module.model.layers.2.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="786,query_states.5"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="481" name="Constant_1187727" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="482" name="__module.model.layers.2.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="792"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="483" name="__module.model.layers.2.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="484" name="__module.model.layers.2.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="793,q.5"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="485" name="__module.model.layers.2.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="802"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="486" name="Constant_1084691" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="487" name="Constant_1084693" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="488" name="Constant_1084695" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="489" name="__module.model.layers.2.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="812,x2.9"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="490" name="Constant_1175856" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="491" name="__module.model.layers.2.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="813"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="492" name="Constant_1084588" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="493" name="Constant_1084632" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="494" name="Constant_1084634" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="495" name="__module.model.layers.2.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="807"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="496" name="__module.model.layers.2.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="815"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="497" name="__module.model.layers.2.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="816"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="498" name="__module.model.layers.2.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="817"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="499" name="ReadValue_1190108" type="ReadValue" version="opset6"> <data variable_id="past_key_values.2.keypresent.2.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.2.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="500" name="Constant_1189387" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="501" name="Gather_1189388" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="502" name="self.model.layers.2.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="887916304" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="503" name="Convert_1230392" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="504" name="self.model.layers.2.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="891062032" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="505" name="Convert_1230395" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="506" name="self.model.layers.2.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="507" name="self.model.layers.2.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="891063056" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="508" name="self.model.layers.2.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="509" name="__module.model.layers.2.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="510" name="__module.model.layers.2.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="788,key_states.13"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="511" name="Constant_1187728" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="512" name="__module.model.layers.2.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="795"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="513" name="__module.model.layers.2.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="514" name="__module.model.layers.2.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="796,k.5"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="515" name="__module.model.layers.2.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="818"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="516" name="Constant_1084834" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="517" name="Constant_1084836" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="518" name="Constant_1084838" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="519" name="__module.model.layers.2.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="828,x2.11"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="520" name="Constant_1175857" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="521" name="__module.model.layers.2.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="829"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="522" name="Constant_1084731" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="523" name="Constant_1084775" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="524" name="Constant_1084777" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="525" name="__module.model.layers.2.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="823"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="526" name="__module.model.layers.2.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="831"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="527" name="__module.model.layers.2.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="832"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="528" name="__module.model.layers.2.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="833"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="529" name="__module.model.layers.2.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="843,844,hidden_states.69,present.2.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="530" name="__module.model.layers.2.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="845,846,847"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="531" name="__module.model.layers.2.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="849,hidden_states.71"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="532" name="Constant_1187729" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="533" name="__module.model.layers.2.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="853,key_states.15"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="534" name="ReadValue_1190110" type="ReadValue" version="opset6"> <data variable_id="past_key_values.2.valuepresent.2.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.2.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="535" name="Constant_1189390" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="536" name="Gather_1189391" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="537" name="self.model.layers.2.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="891065104" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="538" name="Convert_1230382" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="539" name="self.model.layers.2.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="894210832" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="540" name="Convert_1230385" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="541" name="self.model.layers.2.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="542" name="self.model.layers.2.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="894211856" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="543" name="self.model.layers.2.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="544" name="__module.model.layers.2.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="545" name="__module.model.layers.2.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="790,value_states.5"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="546" name="Constant_1187730" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="547" name="__module.model.layers.2.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="798"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="548" name="__module.model.layers.2.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="549" name="__module.model.layers.2.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="799"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="550" name="__module.model.layers.2.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="859,860,hidden_states.73,present.2.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="551" name="__module.model.layers.2.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="861,862,863"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="552" name="__module.model.layers.2.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="865,hidden_states.75"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="553" name="Constant_1187731" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="554" name="__module.model.layers.2.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="869"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="555" name="__module.model.layers.2.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="875,attn_output.9"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="556" name="__module.model.layers.2.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="557" name="__module.model.layers.2.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="876"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="558" name="__module.model.layers.2.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="879"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="559" name="self.model.layers.2.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="894213904" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="560" name="Convert_1229592" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="561" name="self.model.layers.2.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="903651088" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="562" name="Convert_1229595" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="563" name="self.model.layers.2.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="564" name="self.model.layers.2.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="903654160" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="565" name="self.model.layers.2.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="566" name="__module.model.layers.2.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="567" name="__module.model.layers.2.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="881,883,hidden_states.77"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="568" name="__module.model.layers.2/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="886,888,899,hidden_states.79,hidden_states.81"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="569" name="Constant_1175861" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="903660304" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="570" name="Constant_1175860" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="571" name="Constant_1175858" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="572" name="__module.model.layers.2.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="889"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="573" name="Constant_1085437" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="890"> <dim>1</dim> </port> </output> </layer> <layer id="574" name="__module.model.layers.2.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="891,variance.11"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="575" name="Constant_1175859" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="576" name="__module.model.layers.2.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="892"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="577" name="__module.model.layers.2.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="578" name="__module.model.layers.2.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="893"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="579" name="__module.model.layers.2.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="894,895,hidden_states.83,hidden_states.85"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="580" name="__module.model.layers.2.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="896,898"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="581" name="self.model.layers.2.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="903672592" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="582" name="Convert_1228412" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="583" name="self.model.layers.2.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="974451472" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="584" name="Convert_1228415" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="585" name="self.model.layers.2.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="586" name="self.model.layers.2.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="974474512" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="587" name="self.model.layers.2.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="588" name="__module.model.layers.2.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="589" name="__module.model.layers.2.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="904,input.5"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="590" name="__module.model.layers.2.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="905"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="591" name="self.model.layers.2.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="974520592" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="592" name="Convert_1228402" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="593" name="self.model.layers.2.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="1045299472" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="594" name="Convert_1228405" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="595" name="self.model.layers.2.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="596" name="self.model.layers.2.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="1045322512" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="597" name="self.model.layers.2.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="598" name="__module.model.layers.2.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="599" name="__module.model.layers.2.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="907"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="600" name="__module.model.layers.2.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="908"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="601" name="self.model.layers.2.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="1045368592" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="602" name="Convert_1228422" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="603" name="self.model.layers.2.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1116147472" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="604" name="Convert_1228425" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="605" name="self.model.layers.2.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="606" name="self.model.layers.2.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1116150544" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="607" name="self.model.layers.2.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="608" name="__module.model.layers.2.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="609" name="__module.model.layers.2.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="910,hidden_states.87"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="610" name="__module.model.layers.2/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="911,913,921,932,hidden_states.89,hidden_states.91"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="611" name="Constant_1175865" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="1116156688" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="612" name="Constant_1175864" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="613" name="Constant_1175862" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="614" name="__module.model.layers.3.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="922"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="615" name="Constant_1085511" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="923"> <dim>1</dim> </port> </output> </layer> <layer id="616" name="__module.model.layers.3.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="924,variance.13"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="617" name="Constant_1175863" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="618" name="__module.model.layers.3.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="925"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="619" name="__module.model.layers.3.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="620" name="__module.model.layers.3.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="926"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="621" name="__module.model.layers.3.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="927,928,hidden_states.93,hidden_states.95"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="622" name="__module.model.layers.3.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="929,931,hidden_states.97"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="623" name="self.model.layers.3.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="1116168976" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="624" name="Convert_1229602" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="625" name="self.model.layers.3.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1125606160" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="626" name="Convert_1229605" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="627" name="self.model.layers.3.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="628" name="self.model.layers.3.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1125609232" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="629" name="self.model.layers.3.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="630" name="__module.model.layers.3.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="631" name="__module.model.layers.3.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="940,query_states.7"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="632" name="Constant_1187732" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="633" name="__module.model.layers.3.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="946"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="634" name="__module.model.layers.3.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="635" name="__module.model.layers.3.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="947,q.7"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="636" name="__module.model.layers.3.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="956"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="637" name="Constant_1085908" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="638" name="Constant_1085910" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="639" name="Constant_1085912" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="640" name="__module.model.layers.3.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="966,x2.13"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="641" name="Constant_1175866" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="642" name="__module.model.layers.3.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="967"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="643" name="Constant_1085805" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="644" name="Constant_1085849" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="645" name="Constant_1085851" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="646" name="__module.model.layers.3.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="961"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="647" name="__module.model.layers.3.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="969"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="648" name="__module.model.layers.3.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="970"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="649" name="__module.model.layers.3.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="971"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="650" name="ReadValue_1190152" type="ReadValue" version="opset6"> <data variable_id="past_key_values.3.keypresent.3.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.3.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="651" name="Constant_1189393" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="652" name="Gather_1189394" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="653" name="self.model.layers.3.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="1125615376" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="654" name="Convert_1230412" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="655" name="self.model.layers.3.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="1128761104" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="656" name="Convert_1230415" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="657" name="self.model.layers.3.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="658" name="self.model.layers.3.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="1128762128" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="659" name="self.model.layers.3.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="660" name="__module.model.layers.3.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="661" name="__module.model.layers.3.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="942,key_states.17"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="662" name="Constant_1187733" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="663" name="__module.model.layers.3.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="949"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="664" name="__module.model.layers.3.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="665" name="__module.model.layers.3.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="950,k.7"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="666" name="__module.model.layers.3.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="972"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="667" name="Constant_1086051" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="668" name="Constant_1086053" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="669" name="Constant_1086055" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="670" name="__module.model.layers.3.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="982,x2.15"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="671" name="Constant_1175867" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="672" name="__module.model.layers.3.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="983"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="673" name="Constant_1085948" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="674" name="Constant_1085992" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="675" name="Constant_1085994" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="676" name="__module.model.layers.3.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="977"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="677" name="__module.model.layers.3.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="985"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="678" name="__module.model.layers.3.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="986"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="679" name="__module.model.layers.3.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="987"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="680" name="__module.model.layers.3.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="997,998,hidden_states.99,present.3.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="681" name="__module.model.layers.3.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1000,1001,999"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="682" name="__module.model.layers.3.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1003,hidden_states.101"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="683" name="Constant_1187734" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="684" name="__module.model.layers.3.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1007,key_states.19"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="685" name="ReadValue_1190154" type="ReadValue" version="opset6"> <data variable_id="past_key_values.3.valuepresent.3.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.3.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="686" name="Constant_1189396" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="687" name="Gather_1189397" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="688" name="self.model.layers.3.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="1128764176" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="689" name="Convert_1230402" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="690" name="self.model.layers.3.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="1131909904" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="691" name="Convert_1230405" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="692" name="self.model.layers.3.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="693" name="self.model.layers.3.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="1131910928" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="694" name="self.model.layers.3.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="695" name="__module.model.layers.3.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="696" name="__module.model.layers.3.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="944,value_states.7"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="697" name="Constant_1187735" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="698" name="__module.model.layers.3.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="952"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="699" name="__module.model.layers.3.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="700" name="__module.model.layers.3.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="953"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="701" name="__module.model.layers.3.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1013,1014,hidden_states.103,present.3.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="702" name="__module.model.layers.3.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1015,1016,1017"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="703" name="__module.model.layers.3.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1019,hidden_states.105"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="704" name="Constant_1187736" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="705" name="__module.model.layers.3.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1023"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="706" name="__module.model.layers.3.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1029,attn_output.13"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="707" name="__module.model.layers.3.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="708" name="__module.model.layers.3.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1030"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="709" name="__module.model.layers.3.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1033"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="710" name="self.model.layers.3.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="1131912976" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="711" name="Convert_1229612" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="712" name="self.model.layers.3.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1141350160" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="713" name="Convert_1229615" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="714" name="self.model.layers.3.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="715" name="self.model.layers.3.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1141353232" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="716" name="self.model.layers.3.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="717" name="__module.model.layers.3.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="718" name="__module.model.layers.3.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1035,1037,hidden_states.107"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="719" name="__module.model.layers.3/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1040,1042,1053,hidden_states.109,hidden_states.111"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="720" name="Constant_1175871" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="1141359376" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="721" name="Constant_1175870" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="722" name="Constant_1175868" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="723" name="__module.model.layers.3.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1043"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="724" name="Constant_1086654" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1044"> <dim>1</dim> </port> </output> </layer> <layer id="725" name="__module.model.layers.3.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1045,variance.15"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="726" name="Constant_1175869" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="727" name="__module.model.layers.3.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1046"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="728" name="__module.model.layers.3.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="729" name="__module.model.layers.3.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1047"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="730" name="__module.model.layers.3.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1048,1049,hidden_states.113,hidden_states.115"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="731" name="__module.model.layers.3.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1050,1052"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="732" name="self.model.layers.3.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="1141371664" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="733" name="Convert_1228442" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="734" name="self.model.layers.3.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="1212150544" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="735" name="Convert_1228445" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="736" name="self.model.layers.3.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="737" name="self.model.layers.3.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="1212173584" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="738" name="self.model.layers.3.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="739" name="__module.model.layers.3.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="740" name="__module.model.layers.3.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1058,input.7"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="741" name="__module.model.layers.3.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="1059"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="742" name="self.model.layers.3.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="1212219664" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="743" name="Convert_1228432" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="744" name="self.model.layers.3.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="1282998544" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="745" name="Convert_1228435" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="746" name="self.model.layers.3.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="747" name="self.model.layers.3.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="1283021584" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="748" name="self.model.layers.3.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="749" name="__module.model.layers.3.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="750" name="__module.model.layers.3.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1061"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="751" name="__module.model.layers.3.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1062"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="752" name="self.model.layers.3.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="1283067664" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="753" name="Convert_1228452" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="754" name="self.model.layers.3.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1353846544" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="755" name="Convert_1228455" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="756" name="self.model.layers.3.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="757" name="self.model.layers.3.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1353849616" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="758" name="self.model.layers.3.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="759" name="__module.model.layers.3.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="760" name="__module.model.layers.3.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1064,hidden_states.117"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="761" name="__module.model.layers.3/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1065,1067,1075,1086,hidden_states.119,hidden_states.121"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="762" name="Constant_1175875" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="1353855760" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="763" name="Constant_1175874" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="764" name="Constant_1175872" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="765" name="__module.model.layers.4.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1076"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="766" name="Constant_1086728" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1077"> <dim>1</dim> </port> </output> </layer> <layer id="767" name="__module.model.layers.4.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1078,variance.17"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="768" name="Constant_1175873" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="769" name="__module.model.layers.4.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1079"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="770" name="__module.model.layers.4.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="771" name="__module.model.layers.4.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1080"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="772" name="__module.model.layers.4.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1081,1082,hidden_states.123,hidden_states.125"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="773" name="__module.model.layers.4.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1083,1085,hidden_states.127"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="774" name="self.model.layers.4.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="1353868048" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="775" name="Convert_1229622" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="776" name="self.model.layers.4.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1363305232" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="777" name="Convert_1229625" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="778" name="self.model.layers.4.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="779" name="self.model.layers.4.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1363308304" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="780" name="self.model.layers.4.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="781" name="__module.model.layers.4.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="782" name="__module.model.layers.4.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1094,query_states.9"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="783" name="Constant_1187737" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="784" name="__module.model.layers.4.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1100"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="785" name="__module.model.layers.4.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="786" name="__module.model.layers.4.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1101,q.9"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="787" name="__module.model.layers.4.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1110"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="788" name="Constant_1087125" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="789" name="Constant_1087127" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="790" name="Constant_1087129" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="791" name="__module.model.layers.4.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1120,x2.17"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="792" name="Constant_1175876" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="793" name="__module.model.layers.4.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1121"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="794" name="Constant_1087022" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="795" name="Constant_1087066" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="796" name="Constant_1087068" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="797" name="__module.model.layers.4.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1115"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="798" name="__module.model.layers.4.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1123"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="799" name="__module.model.layers.4.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1124"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="800" name="__module.model.layers.4.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1125"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="801" name="ReadValue_1190196" type="ReadValue" version="opset6"> <data variable_id="past_key_values.4.keypresent.4.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.4.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="802" name="Constant_1189399" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="803" name="Gather_1189400" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="804" name="self.model.layers.4.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="1363314448" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="805" name="Convert_1230432" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="806" name="self.model.layers.4.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="1366460176" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="807" name="Convert_1230435" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="808" name="self.model.layers.4.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="809" name="self.model.layers.4.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="1366461200" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="810" name="self.model.layers.4.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="811" name="__module.model.layers.4.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="812" name="__module.model.layers.4.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1096,key_states.21"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="813" name="Constant_1187738" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="814" name="__module.model.layers.4.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1103"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="815" name="__module.model.layers.4.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="816" name="__module.model.layers.4.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1104,k.9"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="817" name="__module.model.layers.4.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1126"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="818" name="Constant_1087268" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="819" name="Constant_1087270" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="820" name="Constant_1087272" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="821" name="__module.model.layers.4.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1136,x2.19"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="822" name="Constant_1175877" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="823" name="__module.model.layers.4.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1137"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="824" name="Constant_1087165" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="825" name="Constant_1087209" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="826" name="Constant_1087211" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="827" name="__module.model.layers.4.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1131"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="828" name="__module.model.layers.4.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1139"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="829" name="__module.model.layers.4.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1140"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="830" name="__module.model.layers.4.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1141"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="831" name="__module.model.layers.4.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1151,1152,hidden_states.129,present.4.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="832" name="__module.model.layers.4.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1153,1154,1155"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="833" name="__module.model.layers.4.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1157,hidden_states.131"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="834" name="Constant_1187739" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="835" name="__module.model.layers.4.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1161,key_states.23"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="836" name="ReadValue_1190198" type="ReadValue" version="opset6"> <data variable_id="past_key_values.4.valuepresent.4.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.4.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="837" name="Constant_1189402" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="838" name="Gather_1189403" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="839" name="self.model.layers.4.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="1366463248" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="840" name="Convert_1230422" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="841" name="self.model.layers.4.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="1369608976" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="842" name="Convert_1230425" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="843" name="self.model.layers.4.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="844" name="self.model.layers.4.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="1369610000" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="845" name="self.model.layers.4.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="846" name="__module.model.layers.4.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="847" name="__module.model.layers.4.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1098,value_states.9"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="848" name="Constant_1187740" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="849" name="__module.model.layers.4.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1106"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="850" name="__module.model.layers.4.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="851" name="__module.model.layers.4.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1107"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="852" name="__module.model.layers.4.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1167,1168,hidden_states.133,present.4.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="853" name="__module.model.layers.4.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1169,1170,1171"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="854" name="__module.model.layers.4.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1173,hidden_states.135"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="855" name="Constant_1187741" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="856" name="__module.model.layers.4.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1177"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="857" name="__module.model.layers.4.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1183,attn_output.17"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="858" name="__module.model.layers.4.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="859" name="__module.model.layers.4.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1184"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="860" name="__module.model.layers.4.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1187"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="861" name="self.model.layers.4.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="1369612048" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="862" name="Convert_1229632" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="863" name="self.model.layers.4.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1379049232" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="864" name="Convert_1229635" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="865" name="self.model.layers.4.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="866" name="self.model.layers.4.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1379052304" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="867" name="self.model.layers.4.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="868" name="__module.model.layers.4.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="869" name="__module.model.layers.4.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1189,1191,hidden_states.137"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="870" name="__module.model.layers.4/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1194,1196,1207,hidden_states.139,hidden_states.141"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="871" name="Constant_1175881" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="1379058448" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="872" name="Constant_1175880" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="873" name="Constant_1175878" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="874" name="__module.model.layers.4.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1197"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="875" name="Constant_1087871" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1198"> <dim>1</dim> </port> </output> </layer> <layer id="876" name="__module.model.layers.4.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1199,variance.19"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="877" name="Constant_1175879" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="878" name="__module.model.layers.4.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1200"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="879" name="__module.model.layers.4.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="880" name="__module.model.layers.4.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1201"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="881" name="__module.model.layers.4.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1202,1203,hidden_states.143,hidden_states.145"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="882" name="__module.model.layers.4.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1204,1206"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="883" name="self.model.layers.4.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="1379070736" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="884" name="Convert_1228472" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="885" name="self.model.layers.4.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="1449849616" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="886" name="Convert_1228475" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="887" name="self.model.layers.4.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="888" name="self.model.layers.4.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="1449872656" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="889" name="self.model.layers.4.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="890" name="__module.model.layers.4.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="891" name="__module.model.layers.4.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1212,input.9"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="892" name="__module.model.layers.4.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="1213"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="893" name="self.model.layers.4.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="1449918736" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="894" name="Convert_1228462" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="895" name="self.model.layers.4.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="1520697616" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="896" name="Convert_1228465" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="897" name="self.model.layers.4.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="898" name="self.model.layers.4.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="1520720656" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="899" name="self.model.layers.4.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="900" name="__module.model.layers.4.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="901" name="__module.model.layers.4.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1215"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="902" name="__module.model.layers.4.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1216"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="903" name="self.model.layers.4.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="1520766736" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="904" name="Convert_1228482" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="905" name="self.model.layers.4.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1591545616" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="906" name="Convert_1228485" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="907" name="self.model.layers.4.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="908" name="self.model.layers.4.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1591548688" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="909" name="self.model.layers.4.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="910" name="__module.model.layers.4.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="911" name="__module.model.layers.4.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1218,hidden_states.147"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="912" name="__module.model.layers.4/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1219,1221,1229,1240,hidden_states.149,hidden_states.151"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="913" name="Constant_1175885" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="1591554832" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="914" name="Constant_1175884" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="915" name="Constant_1175882" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="916" name="__module.model.layers.5.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1230"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="917" name="Constant_1087945" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1231"> <dim>1</dim> </port> </output> </layer> <layer id="918" name="__module.model.layers.5.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1232,variance.21"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="919" name="Constant_1175883" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="920" name="__module.model.layers.5.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1233"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="921" name="__module.model.layers.5.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="922" name="__module.model.layers.5.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1234"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="923" name="__module.model.layers.5.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1235,1236,hidden_states.153,hidden_states.155"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="924" name="__module.model.layers.5.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1237,1239,hidden_states.157"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="925" name="self.model.layers.5.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="1591567120" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="926" name="Convert_1229642" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="927" name="self.model.layers.5.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1601004304" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="928" name="Convert_1229645" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="929" name="self.model.layers.5.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="930" name="self.model.layers.5.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1601007376" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="931" name="self.model.layers.5.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="932" name="__module.model.layers.5.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="933" name="__module.model.layers.5.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1248,query_states.11"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="934" name="Constant_1187742" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="935" name="__module.model.layers.5.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1254"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="936" name="__module.model.layers.5.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="937" name="__module.model.layers.5.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1255,q.11"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="938" name="__module.model.layers.5.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1264"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="939" name="Constant_1088342" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="940" name="Constant_1088344" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="941" name="Constant_1088346" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="942" name="__module.model.layers.5.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1274,x2.21"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="943" name="Constant_1175886" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="944" name="__module.model.layers.5.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1275"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="945" name="Constant_1088239" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="946" name="Constant_1088283" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="947" name="Constant_1088285" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="948" name="__module.model.layers.5.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1269"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="949" name="__module.model.layers.5.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1277"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="950" name="__module.model.layers.5.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1278"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="951" name="__module.model.layers.5.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1279"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="952" name="ReadValue_1190200" type="ReadValue" version="opset6"> <data variable_id="past_key_values.5.keypresent.5.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.5.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="953" name="Constant_1189405" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="954" name="Gather_1189406" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="955" name="self.model.layers.5.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="1601013520" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="956" name="Convert_1230452" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="957" name="self.model.layers.5.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="1604159248" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="958" name="Convert_1230455" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="959" name="self.model.layers.5.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="960" name="self.model.layers.5.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="1604160272" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="961" name="self.model.layers.5.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="962" name="__module.model.layers.5.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="963" name="__module.model.layers.5.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1250,key_states.25"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="964" name="Constant_1187743" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="965" name="__module.model.layers.5.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1257"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="966" name="__module.model.layers.5.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="967" name="__module.model.layers.5.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1258,k.11"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="968" name="__module.model.layers.5.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1280"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="969" name="Constant_1088485" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="970" name="Constant_1088487" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="971" name="Constant_1088489" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="972" name="__module.model.layers.5.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1290,x2.23"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="973" name="Constant_1175887" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="974" name="__module.model.layers.5.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1291"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="975" name="Constant_1088382" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="976" name="Constant_1088426" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="977" name="Constant_1088428" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="978" name="__module.model.layers.5.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1285"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="979" name="__module.model.layers.5.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1293"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="980" name="__module.model.layers.5.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1294"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="981" name="__module.model.layers.5.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1295"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="982" name="__module.model.layers.5.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1305,1306,hidden_states.159,present.5.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="983" name="__module.model.layers.5.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1307,1308,1309"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="984" name="__module.model.layers.5.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1311,hidden_states.161"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="985" name="Constant_1187744" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="986" name="__module.model.layers.5.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1315,key_states.27"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="987" name="ReadValue_1190202" type="ReadValue" version="opset6"> <data variable_id="past_key_values.5.valuepresent.5.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.5.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="988" name="Constant_1189408" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="989" name="Gather_1189409" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="990" name="self.model.layers.5.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="1604162320" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="991" name="Convert_1230442" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="992" name="self.model.layers.5.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="1607308048" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="993" name="Convert_1230445" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="994" name="self.model.layers.5.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="995" name="self.model.layers.5.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="1607309072" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="996" name="self.model.layers.5.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="997" name="__module.model.layers.5.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="998" name="__module.model.layers.5.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1252,value_states.11"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="999" name="Constant_1187745" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1000" name="__module.model.layers.5.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1260"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1001" name="__module.model.layers.5.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1002" name="__module.model.layers.5.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1261"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1003" name="__module.model.layers.5.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1321,1322,hidden_states.163,present.5.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1004" name="__module.model.layers.5.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1323,1324,1325"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1005" name="__module.model.layers.5.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1327,hidden_states.165"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1006" name="Constant_1187746" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1007" name="__module.model.layers.5.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1331"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1008" name="__module.model.layers.5.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1337,attn_output.21"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1009" name="__module.model.layers.5.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1010" name="__module.model.layers.5.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1338"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1011" name="__module.model.layers.5.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1341"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1012" name="self.model.layers.5.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="1607311120" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1013" name="Convert_1229652" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1014" name="self.model.layers.5.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1616748304" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1015" name="Convert_1229655" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1016" name="self.model.layers.5.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1017" name="self.model.layers.5.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1616751376" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1018" name="self.model.layers.5.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1019" name="__module.model.layers.5.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1020" name="__module.model.layers.5.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1343,1345,hidden_states.167"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1021" name="__module.model.layers.5/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1348,1350,1361,hidden_states.169,hidden_states.171"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1022" name="Constant_1175891" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="1616757520" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1023" name="Constant_1175890" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1024" name="Constant_1175888" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1025" name="__module.model.layers.5.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1351"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1026" name="Constant_1089088" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1352"> <dim>1</dim> </port> </output> </layer> <layer id="1027" name="__module.model.layers.5.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1353,variance.23"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1028" name="Constant_1175889" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1029" name="__module.model.layers.5.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1354"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1030" name="__module.model.layers.5.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1031" name="__module.model.layers.5.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1355"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1032" name="__module.model.layers.5.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1356,1357,hidden_states.173,hidden_states.175"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1033" name="__module.model.layers.5.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1358,1360"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1034" name="self.model.layers.5.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="1616769808" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1035" name="Convert_1228502" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1036" name="self.model.layers.5.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="1687548688" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1037" name="Convert_1228505" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1038" name="self.model.layers.5.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1039" name="self.model.layers.5.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="1687571728" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1040" name="self.model.layers.5.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1041" name="__module.model.layers.5.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1042" name="__module.model.layers.5.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1366,input.11"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1043" name="__module.model.layers.5.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="1367"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1044" name="self.model.layers.5.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="1687617808" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1045" name="Convert_1228492" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1046" name="self.model.layers.5.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="1758396688" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1047" name="Convert_1228495" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1048" name="self.model.layers.5.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1049" name="self.model.layers.5.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="1758419728" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1050" name="self.model.layers.5.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1051" name="__module.model.layers.5.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1052" name="__module.model.layers.5.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1369"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1053" name="__module.model.layers.5.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1370"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1054" name="self.model.layers.5.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="1758465808" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1055" name="Convert_1228512" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1056" name="self.model.layers.5.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1829244688" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1057" name="Convert_1228515" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1058" name="self.model.layers.5.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1059" name="self.model.layers.5.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1829247760" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1060" name="self.model.layers.5.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1061" name="__module.model.layers.5.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1062" name="__module.model.layers.5.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1372,hidden_states.177"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1063" name="__module.model.layers.5/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1373,1375,1383,1394,hidden_states.179,hidden_states.181"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1064" name="Constant_1175895" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="1829253904" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1065" name="Constant_1175894" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1066" name="Constant_1175892" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1067" name="__module.model.layers.6.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1384"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1068" name="Constant_1089162" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1385"> <dim>1</dim> </port> </output> </layer> <layer id="1069" name="__module.model.layers.6.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1386,variance.25"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1070" name="Constant_1175893" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1071" name="__module.model.layers.6.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1387"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1072" name="__module.model.layers.6.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1073" name="__module.model.layers.6.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1388"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1074" name="__module.model.layers.6.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1389,1390,hidden_states.183,hidden_states.185"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1075" name="__module.model.layers.6.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1391,1393,hidden_states.187"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1076" name="self.model.layers.6.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="1829266192" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1077" name="Convert_1229662" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1078" name="self.model.layers.6.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1838703376" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1079" name="Convert_1229665" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1080" name="self.model.layers.6.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1081" name="self.model.layers.6.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1838706448" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1082" name="self.model.layers.6.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1083" name="__module.model.layers.6.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1084" name="__module.model.layers.6.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1402,query_states.13"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1085" name="Constant_1187747" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1086" name="__module.model.layers.6.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1408"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1087" name="__module.model.layers.6.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1088" name="__module.model.layers.6.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1409,q.13"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1089" name="__module.model.layers.6.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1418"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1090" name="Constant_1089559" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1091" name="Constant_1089561" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1092" name="Constant_1089563" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1093" name="__module.model.layers.6.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1428,x2.25"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1094" name="Constant_1175896" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1095" name="__module.model.layers.6.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1429"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1096" name="Constant_1089456" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1097" name="Constant_1089500" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1098" name="Constant_1089502" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1099" name="__module.model.layers.6.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1423"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1100" name="__module.model.layers.6.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1431"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1101" name="__module.model.layers.6.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1432"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1102" name="__module.model.layers.6.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1433"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1103" name="ReadValue_1190204" type="ReadValue" version="opset6"> <data variable_id="past_key_values.6.keypresent.6.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.6.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1104" name="Constant_1189411" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1105" name="Gather_1189412" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1106" name="self.model.layers.6.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="1838712592" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1107" name="Convert_1230472" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1108" name="self.model.layers.6.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="1841858320" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1109" name="Convert_1230475" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1110" name="self.model.layers.6.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1111" name="self.model.layers.6.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="1841859344" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1112" name="self.model.layers.6.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1113" name="__module.model.layers.6.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1114" name="__module.model.layers.6.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1404,key_states.29"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1115" name="Constant_1187748" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1116" name="__module.model.layers.6.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1411"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1117" name="__module.model.layers.6.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1118" name="__module.model.layers.6.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1412,k.13"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1119" name="__module.model.layers.6.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1434"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1120" name="Constant_1089702" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1121" name="Constant_1089704" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1122" name="Constant_1089706" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1123" name="__module.model.layers.6.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1444,x2.27"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1124" name="Constant_1175897" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1125" name="__module.model.layers.6.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1445"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1126" name="Constant_1089599" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1127" name="Constant_1089643" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1128" name="Constant_1089645" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1129" name="__module.model.layers.6.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1439"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1130" name="__module.model.layers.6.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1447"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1131" name="__module.model.layers.6.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1448"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1132" name="__module.model.layers.6.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1449"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1133" name="__module.model.layers.6.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1459,1460,hidden_states.189,present.6.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1134" name="__module.model.layers.6.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1461,1462,1463"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1135" name="__module.model.layers.6.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1465,hidden_states.191"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1136" name="Constant_1187749" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1137" name="__module.model.layers.6.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1469,key_states.31"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1138" name="ReadValue_1190206" type="ReadValue" version="opset6"> <data variable_id="past_key_values.6.valuepresent.6.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.6.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1139" name="Constant_1189414" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1140" name="Gather_1189415" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1141" name="self.model.layers.6.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="1841861392" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1142" name="Convert_1230462" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1143" name="self.model.layers.6.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="1845007120" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1144" name="Convert_1230465" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1145" name="self.model.layers.6.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1146" name="self.model.layers.6.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="1845008144" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1147" name="self.model.layers.6.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1148" name="__module.model.layers.6.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1149" name="__module.model.layers.6.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1406,value_states.13"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1150" name="Constant_1187750" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1151" name="__module.model.layers.6.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1414"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1152" name="__module.model.layers.6.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1153" name="__module.model.layers.6.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1415"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1154" name="__module.model.layers.6.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1475,1476,hidden_states.193,present.6.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1155" name="__module.model.layers.6.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1477,1478,1479"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1156" name="__module.model.layers.6.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1481,hidden_states.195"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1157" name="Constant_1187751" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1158" name="__module.model.layers.6.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1485"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1159" name="__module.model.layers.6.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1491,attn_output.25"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1160" name="__module.model.layers.6.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1161" name="__module.model.layers.6.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1492"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1162" name="__module.model.layers.6.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1495"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1163" name="self.model.layers.6.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="1845010192" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1164" name="Convert_1229672" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1165" name="self.model.layers.6.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="1854447376" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1166" name="Convert_1229675" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1167" name="self.model.layers.6.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1168" name="self.model.layers.6.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="1854450448" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1169" name="self.model.layers.6.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1170" name="__module.model.layers.6.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1171" name="__module.model.layers.6.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1497,1499,hidden_states.197"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1172" name="__module.model.layers.6/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1502,1504,1515,hidden_states.199,hidden_states.201"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1173" name="Constant_1175901" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="1854456592" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1174" name="Constant_1175900" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1175" name="Constant_1175898" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1176" name="__module.model.layers.6.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1505"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1177" name="Constant_1090305" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1506"> <dim>1</dim> </port> </output> </layer> <layer id="1178" name="__module.model.layers.6.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1507,variance.27"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1179" name="Constant_1175899" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1180" name="__module.model.layers.6.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1508"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1181" name="__module.model.layers.6.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1182" name="__module.model.layers.6.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1509"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1183" name="__module.model.layers.6.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1510,1511,hidden_states.203,hidden_states.205"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1184" name="__module.model.layers.6.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1512,1514"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1185" name="self.model.layers.6.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="1854468880" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1186" name="Convert_1228532" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1187" name="self.model.layers.6.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="1925247760" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1188" name="Convert_1228535" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1189" name="self.model.layers.6.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1190" name="self.model.layers.6.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="1925270800" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1191" name="self.model.layers.6.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1192" name="__module.model.layers.6.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1193" name="__module.model.layers.6.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1520,input.13"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1194" name="__module.model.layers.6.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="1521"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1195" name="self.model.layers.6.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="1925316880" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1196" name="Convert_1228522" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1197" name="self.model.layers.6.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="1996095760" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1198" name="Convert_1228525" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1199" name="self.model.layers.6.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1200" name="self.model.layers.6.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="1996118800" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1201" name="self.model.layers.6.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1202" name="__module.model.layers.6.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1203" name="__module.model.layers.6.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1523"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1204" name="__module.model.layers.6.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1524"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1205" name="self.model.layers.6.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="1996164880" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1206" name="Convert_1228542" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1207" name="self.model.layers.6.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2066943760" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1208" name="Convert_1228545" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1209" name="self.model.layers.6.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1210" name="self.model.layers.6.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2066946832" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1211" name="self.model.layers.6.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1212" name="__module.model.layers.6.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1213" name="__module.model.layers.6.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1526,hidden_states.207"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1214" name="__module.model.layers.6/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1527,1529,1537,1548,hidden_states.209,hidden_states.211"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1215" name="Constant_1175905" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="2066952976" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1216" name="Constant_1175904" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1217" name="Constant_1175902" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1218" name="__module.model.layers.7.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1538"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1219" name="Constant_1090379" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1539"> <dim>1</dim> </port> </output> </layer> <layer id="1220" name="__module.model.layers.7.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1540,variance.29"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1221" name="Constant_1175903" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1222" name="__module.model.layers.7.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1541"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1223" name="__module.model.layers.7.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1224" name="__module.model.layers.7.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1542"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1225" name="__module.model.layers.7.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1543,1544,hidden_states.213,hidden_states.215"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1226" name="__module.model.layers.7.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1545,1547,hidden_states.217"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1227" name="self.model.layers.7.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="2066965264" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1228" name="Convert_1229682" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1229" name="self.model.layers.7.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2076402448" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1230" name="Convert_1229685" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1231" name="self.model.layers.7.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1232" name="self.model.layers.7.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2076405520" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1233" name="self.model.layers.7.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1234" name="__module.model.layers.7.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1235" name="__module.model.layers.7.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1556,query_states.15"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1236" name="Constant_1187752" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1237" name="__module.model.layers.7.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1562"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1238" name="__module.model.layers.7.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1239" name="__module.model.layers.7.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1563,q.15"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1240" name="__module.model.layers.7.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1572"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1241" name="Constant_1090776" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1242" name="Constant_1090778" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1243" name="Constant_1090780" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1244" name="__module.model.layers.7.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1582,x2.29"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1245" name="Constant_1175906" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1246" name="__module.model.layers.7.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1583"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1247" name="Constant_1090673" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1248" name="Constant_1090717" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1249" name="Constant_1090719" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1250" name="__module.model.layers.7.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1577"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1251" name="__module.model.layers.7.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1585"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1252" name="__module.model.layers.7.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1586"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1253" name="__module.model.layers.7.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1587"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1254" name="ReadValue_1190208" type="ReadValue" version="opset6"> <data variable_id="past_key_values.7.keypresent.7.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.7.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1255" name="Constant_1189417" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1256" name="Gather_1189418" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1257" name="self.model.layers.7.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="2076411664" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1258" name="Convert_1230492" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1259" name="self.model.layers.7.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="2079557392" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1260" name="Convert_1230495" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1261" name="self.model.layers.7.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1262" name="self.model.layers.7.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="2079558416" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1263" name="self.model.layers.7.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1264" name="__module.model.layers.7.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1265" name="__module.model.layers.7.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1558,key_states.33"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1266" name="Constant_1187753" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1267" name="__module.model.layers.7.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1565"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1268" name="__module.model.layers.7.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1269" name="__module.model.layers.7.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1566,k.15"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1270" name="__module.model.layers.7.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1588"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1271" name="Constant_1090919" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1272" name="Constant_1090921" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1273" name="Constant_1090923" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1274" name="__module.model.layers.7.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1598,x2.31"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1275" name="Constant_1175907" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1276" name="__module.model.layers.7.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1599"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1277" name="Constant_1090816" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1278" name="Constant_1090860" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1279" name="Constant_1090862" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1280" name="__module.model.layers.7.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1593"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1281" name="__module.model.layers.7.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1601"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1282" name="__module.model.layers.7.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1602"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1283" name="__module.model.layers.7.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1603"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1284" name="__module.model.layers.7.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1613,1614,hidden_states.219,present.7.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1285" name="__module.model.layers.7.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1615,1616,1617"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1286" name="__module.model.layers.7.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1619,hidden_states.221"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1287" name="Constant_1187754" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1288" name="__module.model.layers.7.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1623,key_states.35"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1289" name="ReadValue_1190210" type="ReadValue" version="opset6"> <data variable_id="past_key_values.7.valuepresent.7.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.7.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1290" name="Constant_1189420" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1291" name="Gather_1189421" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1292" name="self.model.layers.7.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="2079560464" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1293" name="Convert_1230482" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1294" name="self.model.layers.7.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="2082706192" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1295" name="Convert_1230485" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1296" name="self.model.layers.7.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1297" name="self.model.layers.7.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="2082707216" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1298" name="self.model.layers.7.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1299" name="__module.model.layers.7.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1300" name="__module.model.layers.7.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1560,value_states.15"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1301" name="Constant_1187755" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1302" name="__module.model.layers.7.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1568"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1303" name="__module.model.layers.7.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1304" name="__module.model.layers.7.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1569"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1305" name="__module.model.layers.7.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1629,1630,hidden_states.223,present.7.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1306" name="__module.model.layers.7.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1631,1632,1633"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1307" name="__module.model.layers.7.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1635,hidden_states.225"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1308" name="Constant_1187756" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1309" name="__module.model.layers.7.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1639"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1310" name="__module.model.layers.7.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1645,attn_output.29"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1311" name="__module.model.layers.7.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1312" name="__module.model.layers.7.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1646"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1313" name="__module.model.layers.7.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1649"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1314" name="self.model.layers.7.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="2082709264" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1315" name="Convert_1229692" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1316" name="self.model.layers.7.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2092146448" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1317" name="Convert_1229695" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1318" name="self.model.layers.7.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1319" name="self.model.layers.7.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2092149520" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1320" name="self.model.layers.7.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1321" name="__module.model.layers.7.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1322" name="__module.model.layers.7.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1651,1653,hidden_states.227"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1323" name="__module.model.layers.7/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1656,1658,1669,hidden_states.229,hidden_states.231"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1324" name="Constant_1175911" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="2092155664" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1325" name="Constant_1175910" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1326" name="Constant_1175908" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1327" name="__module.model.layers.7.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1659"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1328" name="Constant_1091522" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1660"> <dim>1</dim> </port> </output> </layer> <layer id="1329" name="__module.model.layers.7.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1661,variance.31"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1330" name="Constant_1175909" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1331" name="__module.model.layers.7.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1662"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1332" name="__module.model.layers.7.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1333" name="__module.model.layers.7.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1663"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1334" name="__module.model.layers.7.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1664,1665,hidden_states.233,hidden_states.235"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1335" name="__module.model.layers.7.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1666,1668"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1336" name="self.model.layers.7.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="2092167952" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1337" name="Convert_1228562" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1338" name="self.model.layers.7.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="2162946832" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1339" name="Convert_1228565" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1340" name="self.model.layers.7.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1341" name="self.model.layers.7.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="2162969872" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1342" name="self.model.layers.7.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1343" name="__module.model.layers.7.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1344" name="__module.model.layers.7.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1674,input.15"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1345" name="__module.model.layers.7.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="1675"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1346" name="self.model.layers.7.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="2163015952" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1347" name="Convert_1228552" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1348" name="self.model.layers.7.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="2233794832" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1349" name="Convert_1228555" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1350" name="self.model.layers.7.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1351" name="self.model.layers.7.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="2233817872" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1352" name="self.model.layers.7.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1353" name="__module.model.layers.7.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1354" name="__module.model.layers.7.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1677"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1355" name="__module.model.layers.7.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1678"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1356" name="self.model.layers.7.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="2233863952" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1357" name="Convert_1228572" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1358" name="self.model.layers.7.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2304642832" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1359" name="Convert_1228575" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1360" name="self.model.layers.7.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1361" name="self.model.layers.7.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2304645904" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1362" name="self.model.layers.7.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1363" name="__module.model.layers.7.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1364" name="__module.model.layers.7.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1680,hidden_states.237"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1365" name="__module.model.layers.7/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1681,1683,1691,1702,hidden_states.239,hidden_states.241"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1366" name="Constant_1175915" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="2304652048" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1367" name="Constant_1175914" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1368" name="Constant_1175912" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1369" name="__module.model.layers.8.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1692"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1370" name="Constant_1091596" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1693"> <dim>1</dim> </port> </output> </layer> <layer id="1371" name="__module.model.layers.8.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1694,variance.33"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1372" name="Constant_1175913" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1373" name="__module.model.layers.8.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1695"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1374" name="__module.model.layers.8.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1375" name="__module.model.layers.8.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1696"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1376" name="__module.model.layers.8.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1697,1698,hidden_states.243,hidden_states.245"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1377" name="__module.model.layers.8.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1699,1701,hidden_states.247"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1378" name="self.model.layers.8.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="2304664336" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1379" name="Convert_1229702" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1380" name="self.model.layers.8.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2314101520" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1381" name="Convert_1229705" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1382" name="self.model.layers.8.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1383" name="self.model.layers.8.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2314104592" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1384" name="self.model.layers.8.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1385" name="__module.model.layers.8.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1386" name="__module.model.layers.8.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1710,query_states.17"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1387" name="Constant_1187757" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1388" name="__module.model.layers.8.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1716"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1389" name="__module.model.layers.8.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1390" name="__module.model.layers.8.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1717,q.17"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1391" name="__module.model.layers.8.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1726"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1392" name="Constant_1091993" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1393" name="Constant_1091995" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1394" name="Constant_1091997" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1395" name="__module.model.layers.8.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1736,x2.33"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1396" name="Constant_1175916" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1397" name="__module.model.layers.8.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1737"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1398" name="Constant_1091890" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1399" name="Constant_1091934" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1400" name="Constant_1091936" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1401" name="__module.model.layers.8.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1731"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1402" name="__module.model.layers.8.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1739"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1403" name="__module.model.layers.8.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1740"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1404" name="__module.model.layers.8.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1741"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1405" name="ReadValue_1190212" type="ReadValue" version="opset6"> <data variable_id="past_key_values.8.keypresent.8.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.8.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1406" name="Constant_1189423" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1407" name="Gather_1189424" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1408" name="self.model.layers.8.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="2314110736" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1409" name="Convert_1230512" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1410" name="self.model.layers.8.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="2317256464" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1411" name="Convert_1230515" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1412" name="self.model.layers.8.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1413" name="self.model.layers.8.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="2317257488" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1414" name="self.model.layers.8.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1415" name="__module.model.layers.8.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1416" name="__module.model.layers.8.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1712,key_states.37"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1417" name="Constant_1187758" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1418" name="__module.model.layers.8.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1719"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1419" name="__module.model.layers.8.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1420" name="__module.model.layers.8.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1720,k.17"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1421" name="__module.model.layers.8.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1742"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1422" name="Constant_1092136" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1423" name="Constant_1092138" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1424" name="Constant_1092140" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1425" name="__module.model.layers.8.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1752,x2.35"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1426" name="Constant_1175917" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1427" name="__module.model.layers.8.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1753"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1428" name="Constant_1092033" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1429" name="Constant_1092077" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1430" name="Constant_1092079" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1431" name="__module.model.layers.8.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1747"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1432" name="__module.model.layers.8.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1755"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1433" name="__module.model.layers.8.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1756"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1434" name="__module.model.layers.8.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1757"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1435" name="__module.model.layers.8.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1767,1768,hidden_states.249,present.8.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1436" name="__module.model.layers.8.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1769,1770,1771"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1437" name="__module.model.layers.8.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1773,hidden_states.251"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1438" name="Constant_1187759" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1439" name="__module.model.layers.8.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1777,key_states.39"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1440" name="ReadValue_1190214" type="ReadValue" version="opset6"> <data variable_id="past_key_values.8.valuepresent.8.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.8.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1441" name="Constant_1189426" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1442" name="Gather_1189427" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1443" name="self.model.layers.8.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="2317259536" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1444" name="Convert_1230502" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1445" name="self.model.layers.8.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="2320405264" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1446" name="Convert_1230505" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1447" name="self.model.layers.8.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1448" name="self.model.layers.8.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="2320406288" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1449" name="self.model.layers.8.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1450" name="__module.model.layers.8.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1451" name="__module.model.layers.8.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1714,value_states.17"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1452" name="Constant_1187760" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1453" name="__module.model.layers.8.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1722"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1454" name="__module.model.layers.8.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1455" name="__module.model.layers.8.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1723"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1456" name="__module.model.layers.8.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1783,1784,hidden_states.253,present.8.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1457" name="__module.model.layers.8.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1785,1786,1787"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1458" name="__module.model.layers.8.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1789,hidden_states.255"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1459" name="Constant_1187761" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1460" name="__module.model.layers.8.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1793"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1461" name="__module.model.layers.8.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1799,attn_output.33"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1462" name="__module.model.layers.8.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1463" name="__module.model.layers.8.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1800"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1464" name="__module.model.layers.8.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1803"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1465" name="self.model.layers.8.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="2320408336" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1466" name="Convert_1229712" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1467" name="self.model.layers.8.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2329845520" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1468" name="Convert_1229715" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1469" name="self.model.layers.8.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1470" name="self.model.layers.8.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2329848592" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1471" name="self.model.layers.8.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1472" name="__module.model.layers.8.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1473" name="__module.model.layers.8.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1805,1807,hidden_states.257"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1474" name="__module.model.layers.8/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1810,1812,1823,hidden_states.259,hidden_states.261"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1475" name="Constant_1175921" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="2329854736" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1476" name="Constant_1175920" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1477" name="Constant_1175918" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1478" name="__module.model.layers.8.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1813"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1479" name="Constant_1092739" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1814"> <dim>1</dim> </port> </output> </layer> <layer id="1480" name="__module.model.layers.8.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1815,variance.35"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1481" name="Constant_1175919" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1482" name="__module.model.layers.8.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1816"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1483" name="__module.model.layers.8.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1484" name="__module.model.layers.8.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1817"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1485" name="__module.model.layers.8.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1818,1819,hidden_states.263,hidden_states.265"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1486" name="__module.model.layers.8.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1820,1822"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1487" name="self.model.layers.8.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="2329867024" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1488" name="Convert_1228592" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1489" name="self.model.layers.8.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="2400645904" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1490" name="Convert_1228595" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1491" name="self.model.layers.8.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1492" name="self.model.layers.8.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="2400668944" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1493" name="self.model.layers.8.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1494" name="__module.model.layers.8.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1495" name="__module.model.layers.8.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1828,input.17"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1496" name="__module.model.layers.8.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="1829"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1497" name="self.model.layers.8.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="2400715024" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1498" name="Convert_1228582" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1499" name="self.model.layers.8.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="2471493904" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1500" name="Convert_1228585" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1501" name="self.model.layers.8.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1502" name="self.model.layers.8.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="2471516944" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1503" name="self.model.layers.8.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1504" name="__module.model.layers.8.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1505" name="__module.model.layers.8.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1831"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1506" name="__module.model.layers.8.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1832"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1507" name="self.model.layers.8.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="2471563024" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1508" name="Convert_1228602" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1509" name="self.model.layers.8.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2542341904" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1510" name="Convert_1228605" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1511" name="self.model.layers.8.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1512" name="self.model.layers.8.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2542344976" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1513" name="self.model.layers.8.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1514" name="__module.model.layers.8.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1515" name="__module.model.layers.8.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1834,hidden_states.267"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1516" name="__module.model.layers.8/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1835,1837,1845,1856,hidden_states.269,hidden_states.271"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1517" name="Constant_1175924" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1518" name="Constant_1175922" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1519" name="__module.model.layers.9.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1846"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1520" name="Constant_1092813" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1847"> <dim>1</dim> </port> </output> </layer> <layer id="1521" name="__module.model.layers.9.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1848,variance.37"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1522" name="Constant_1175923" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1523" name="__module.model.layers.9.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1849"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1524" name="__module.model.layers.9.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1525" name="__module.model.layers.9.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1850"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1526" name="__module.model.layers.9.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1851,1852,hidden_states.273,hidden_states.275"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1527" name="__module.model.layers.9.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1853,1855,hidden_states.277"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1528" name="self.model.layers.9.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="2542351120" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1529" name="Convert_1230522" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1530" name="self.model.layers.9.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="2545496848" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1531" name="Convert_1230525" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1532" name="self.model.layers.9.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1533" name="self.model.layers.9.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="2545497872" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1534" name="self.model.layers.9.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1535" name="__module.model.layers.9.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1536" name="__module.model.layers.9.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1868,value_states.19"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1537" name="Constant_1187765" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1538" name="__module.model.layers.9.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1876"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1539" name="__module.model.layers.9.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1540" name="__module.model.layers.9.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1877"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1541" name="__module.model.layers.9.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1937,1938,hidden_states.283,present.9.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1543" name="ReadValue_1190216" type="ReadValue" version="opset6"> <data variable_id="past_key_values.9.keypresent.9.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.9.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1544" name="Constant_1189429" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1545" name="Gather_1189430" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1546" name="self.model.layers.9.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="2545499920" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1547" name="Convert_1230532" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1548" name="self.model.layers.9.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="2548645648" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1549" name="Convert_1230535" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1550" name="self.model.layers.9.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1551" name="self.model.layers.9.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="2548646672" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1552" name="self.model.layers.9.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1553" name="__module.model.layers.9.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1554" name="__module.model.layers.9.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1866,key_states.41"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1555" name="Constant_1187763" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1556" name="__module.model.layers.9.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1873"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1557" name="__module.model.layers.9.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1558" name="__module.model.layers.9.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1874,k.19"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1559" name="__module.model.layers.9.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1896"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1560" name="Constant_1093353" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1561" name="Constant_1093355" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1562" name="Constant_1093357" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1563" name="__module.model.layers.9.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1906,x2.39"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1564" name="Constant_1175927" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1565" name="__module.model.layers.9.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1907"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1566" name="Constant_1093250" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1567" name="Constant_1093294" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1568" name="Constant_1093296" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1569" name="__module.model.layers.9.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1901"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1570" name="__module.model.layers.9.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1909"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1571" name="__module.model.layers.9.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1910"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1572" name="__module.model.layers.9.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1911"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1573" name="__module.model.layers.9.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1921,1922,hidden_states.279,present.9.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1585" name="ReadValue_1190194" type="ReadValue" version="opset6"> <data variable_id="past_key_values.39.valuepresent.39.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.39.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1586" name="Constant_1189612" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1587" name="Gather_1189613" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1588" name="Constant_1176225" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="2548648720" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1589" name="self.model.layers.9.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="2548661008" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1590" name="Convert_1229722" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1591" name="self.model.layers.9.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2558098192" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1592" name="Convert_1229725" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1593" name="self.model.layers.9.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1594" name="self.model.layers.9.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2558101264" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1595" name="self.model.layers.9.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1596" name="__module.model.layers.9.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1597" name="__module.model.layers.9.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1864,query_states.19"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1598" name="Constant_1187762" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1599" name="__module.model.layers.9.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1870"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1600" name="__module.model.layers.9.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1601" name="__module.model.layers.9.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1871,q.19"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1602" name="__module.model.layers.9.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1880"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1603" name="Constant_1093210" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1604" name="Constant_1093212" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1605" name="Constant_1093214" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1606" name="__module.model.layers.9.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1890,x2.37"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1607" name="Constant_1175926" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1608" name="__module.model.layers.9.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1891"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1609" name="Constant_1093107" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1610" name="Constant_1093151" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1611" name="Constant_1093153" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1612" name="__module.model.layers.9.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1885"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1613" name="__module.model.layers.9.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="1893"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1614" name="__module.model.layers.9.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1894"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1615" name="__module.model.layers.9.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="1895"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1616" name="__module.model.layers.9.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1923,1924,1925"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1617" name="__module.model.layers.9.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1927,hidden_states.281"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1618" name="Constant_1187764" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1619" name="__module.model.layers.9.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1931,key_states.43"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1620" name="__module.model.layers.9.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1939,1940,1941"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1621" name="__module.model.layers.9.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="1943,hidden_states.285"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1622" name="Constant_1187766" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1623" name="__module.model.layers.9.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1947"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1624" name="__module.model.layers.9.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1953,attn_output.37"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1625" name="__module.model.layers.9.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1626" name="__module.model.layers.9.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1954"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1627" name="__module.model.layers.9.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1957"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1628" name="self.model.layers.9.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="2558107408" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1629" name="Convert_1229732" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1630" name="self.model.layers.9.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2567544592" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1631" name="Convert_1229735" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1632" name="self.model.layers.9.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1633" name="self.model.layers.9.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2567547664" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1634" name="self.model.layers.9.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1635" name="__module.model.layers.9.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1636" name="__module.model.layers.9.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1959,1961,hidden_states.287"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1637" name="__module.model.layers.9/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1964,1966,1977,hidden_states.289,hidden_states.291"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1638" name="Constant_1175931" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="2567553808" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1639" name="Constant_1175930" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1640" name="Constant_1175928" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1641" name="__module.model.layers.9.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1967"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1642" name="Constant_1093956" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="1968"> <dim>1</dim> </port> </output> </layer> <layer id="1643" name="__module.model.layers.9.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1969,variance.39"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1644" name="Constant_1175929" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1645" name="__module.model.layers.9.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1970"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1646" name="__module.model.layers.9.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1647" name="__module.model.layers.9.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1971"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1648" name="__module.model.layers.9.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1972,1973,hidden_states.293,hidden_states.295"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1649" name="__module.model.layers.9.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1974,1976"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1650" name="self.model.layers.9.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="2567566096" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1651" name="Convert_1228622" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1652" name="self.model.layers.9.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="2638344976" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1653" name="Convert_1228625" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1654" name="self.model.layers.9.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1655" name="self.model.layers.9.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="2638368016" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1656" name="self.model.layers.9.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1657" name="__module.model.layers.9.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1658" name="__module.model.layers.9.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1982,input.19"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1659" name="__module.model.layers.9.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="1983"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1660" name="self.model.layers.9.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="2638414096" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1661" name="Convert_1228612" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1662" name="self.model.layers.9.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="2709192976" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1663" name="Convert_1228615" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1664" name="self.model.layers.9.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1665" name="self.model.layers.9.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="2709216016" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1666" name="self.model.layers.9.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1667" name="__module.model.layers.9.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1668" name="__module.model.layers.9.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1985"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1669" name="__module.model.layers.9.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1986"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1670" name="self.model.layers.9.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="2709262096" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1671" name="Convert_1228632" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1672" name="self.model.layers.9.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2780040976" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1673" name="Convert_1228635" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1674" name="self.model.layers.9.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1675" name="self.model.layers.9.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2780044048" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1676" name="self.model.layers.9.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1677" name="__module.model.layers.9.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1678" name="__module.model.layers.9.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="1988,hidden_states.297"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1679" name="__module.model.layers.9/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1989,1991,1999,2010,hidden_states.299,hidden_states.301"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1680" name="Constant_1175935" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="2780050192" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1681" name="Constant_1175934" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1682" name="Constant_1175932" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1683" name="__module.model.layers.10.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2000"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1684" name="Constant_1094030" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2001"> <dim>1</dim> </port> </output> </layer> <layer id="1685" name="__module.model.layers.10.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2002,variance.41"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1686" name="Constant_1175933" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1687" name="__module.model.layers.10.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2003"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1688" name="__module.model.layers.10.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1689" name="__module.model.layers.10.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2004"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1690" name="__module.model.layers.10.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2005,2006,hidden_states.303,hidden_states.305"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1691" name="__module.model.layers.10.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2007,2009,hidden_states.307"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1692" name="self.model.layers.10.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="2780062480" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1693" name="Convert_1229742" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1694" name="self.model.layers.10.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2789499664" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1695" name="Convert_1229745" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1696" name="self.model.layers.10.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1697" name="self.model.layers.10.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2789502736" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1698" name="self.model.layers.10.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1699" name="__module.model.layers.10.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1700" name="__module.model.layers.10.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2018,query_states.21"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1701" name="Constant_1187767" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1702" name="__module.model.layers.10.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2024"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1703" name="__module.model.layers.10.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1704" name="__module.model.layers.10.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2025,q.21"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1705" name="__module.model.layers.10.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2034"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1706" name="Constant_1094427" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1707" name="Constant_1094429" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1708" name="Constant_1094431" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1709" name="__module.model.layers.10.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2044,x2.41"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1710" name="Constant_1175936" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1711" name="__module.model.layers.10.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2045"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1712" name="Constant_1094324" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1713" name="Constant_1094368" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1714" name="Constant_1094370" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1715" name="__module.model.layers.10.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2039"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1716" name="__module.model.layers.10.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2047"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1717" name="__module.model.layers.10.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2048"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1718" name="__module.model.layers.10.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2049"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1719" name="ReadValue_1190068" type="ReadValue" version="opset6"> <data variable_id="past_key_values.10.keypresent.10.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.10.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1720" name="Constant_1189435" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1721" name="Gather_1189436" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1722" name="self.model.layers.10.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="2789508880" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1723" name="Convert_1230552" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1724" name="self.model.layers.10.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="2792654608" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1725" name="Convert_1230555" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1726" name="self.model.layers.10.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1727" name="self.model.layers.10.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="2792655632" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1728" name="self.model.layers.10.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1729" name="__module.model.layers.10.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1730" name="__module.model.layers.10.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2020,key_states.45"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1731" name="Constant_1187768" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1732" name="__module.model.layers.10.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2027"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1733" name="__module.model.layers.10.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1734" name="__module.model.layers.10.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2028,k.21"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1735" name="__module.model.layers.10.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2050"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1736" name="Constant_1094570" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1737" name="Constant_1094572" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1738" name="Constant_1094574" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1739" name="__module.model.layers.10.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2060,x2.43"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1740" name="Constant_1175937" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1741" name="__module.model.layers.10.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2061"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1742" name="Constant_1094467" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1743" name="Constant_1094511" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1744" name="Constant_1094513" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1745" name="__module.model.layers.10.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2055"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1746" name="__module.model.layers.10.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2063"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1747" name="__module.model.layers.10.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2064"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1748" name="__module.model.layers.10.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2065"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1749" name="__module.model.layers.10.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2075,2076,hidden_states.309,present.10.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1750" name="__module.model.layers.10.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2077,2078,2079"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1751" name="__module.model.layers.10.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2081,hidden_states.311"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1752" name="Constant_1187769" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1753" name="__module.model.layers.10.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2085,key_states.47"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1754" name="ReadValue_1190070" type="ReadValue" version="opset6"> <data variable_id="past_key_values.10.valuepresent.10.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.10.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1755" name="Constant_1189438" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1756" name="Gather_1189439" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1757" name="self.model.layers.10.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="2792657680" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1758" name="Convert_1230542" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1759" name="self.model.layers.10.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="2795803408" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1760" name="Convert_1230545" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1761" name="self.model.layers.10.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1762" name="self.model.layers.10.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="2795804432" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1763" name="self.model.layers.10.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1764" name="__module.model.layers.10.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1765" name="__module.model.layers.10.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2022,value_states.21"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1766" name="Constant_1187770" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1767" name="__module.model.layers.10.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2030"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1768" name="__module.model.layers.10.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1769" name="__module.model.layers.10.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2031"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1770" name="__module.model.layers.10.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2091,2092,hidden_states.313,present.10.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1771" name="__module.model.layers.10.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2093,2094,2095"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1772" name="__module.model.layers.10.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2097,hidden_states.315"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1773" name="Constant_1187771" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1774" name="__module.model.layers.10.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2101"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1775" name="__module.model.layers.10.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2107,attn_output.41"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1776" name="__module.model.layers.10.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1777" name="__module.model.layers.10.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2108"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1778" name="__module.model.layers.10.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2111"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1779" name="self.model.layers.10.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="2795806480" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1780" name="Convert_1229752" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1781" name="self.model.layers.10.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="2805243664" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1782" name="Convert_1229755" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1783" name="self.model.layers.10.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1784" name="self.model.layers.10.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="2805246736" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1785" name="self.model.layers.10.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1786" name="__module.model.layers.10.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1787" name="__module.model.layers.10.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2113,2115,hidden_states.317"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1788" name="__module.model.layers.10/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2118,2120,2131,hidden_states.319,hidden_states.321"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1789" name="Constant_1175941" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="2805252880" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1790" name="Constant_1175940" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1791" name="Constant_1175938" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1792" name="__module.model.layers.10.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2121"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1793" name="Constant_1095173" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2122"> <dim>1</dim> </port> </output> </layer> <layer id="1794" name="__module.model.layers.10.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2123,variance.43"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1795" name="Constant_1175939" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1796" name="__module.model.layers.10.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2124"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1797" name="__module.model.layers.10.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1798" name="__module.model.layers.10.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2125"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1799" name="__module.model.layers.10.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2126,2127,hidden_states.323,hidden_states.325"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1800" name="__module.model.layers.10.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2128,2130"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1801" name="self.model.layers.10.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="2805265168" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1802" name="Convert_1228652" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1803" name="self.model.layers.10.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="2876044048" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1804" name="Convert_1228655" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1805" name="self.model.layers.10.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1806" name="self.model.layers.10.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="2876067088" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1807" name="self.model.layers.10.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1808" name="__module.model.layers.10.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1809" name="__module.model.layers.10.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2136,input.21"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1810" name="__module.model.layers.10.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="2137"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1811" name="self.model.layers.10.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="2876113168" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1812" name="Convert_1228642" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1813" name="self.model.layers.10.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="2946892048" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1814" name="Convert_1228645" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1815" name="self.model.layers.10.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1816" name="self.model.layers.10.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="2946915088" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1817" name="self.model.layers.10.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1818" name="__module.model.layers.10.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1819" name="__module.model.layers.10.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2139"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1820" name="__module.model.layers.10.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2140"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1821" name="self.model.layers.10.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="2946961168" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1822" name="Convert_1228662" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1823" name="self.model.layers.10.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3017740048" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1824" name="Convert_1228665" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1825" name="self.model.layers.10.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1826" name="self.model.layers.10.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3017743120" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1827" name="self.model.layers.10.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1828" name="__module.model.layers.10.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1829" name="__module.model.layers.10.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2142,hidden_states.327"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1830" name="__module.model.layers.10/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2143,2145,2153,2164,hidden_states.329,hidden_states.331"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1831" name="Constant_1175945" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="3017749264" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1832" name="Constant_1175944" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1833" name="Constant_1175942" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1834" name="__module.model.layers.11.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2154"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1835" name="Constant_1095247" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2155"> <dim>1</dim> </port> </output> </layer> <layer id="1836" name="__module.model.layers.11.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2156,variance.45"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1837" name="Constant_1175943" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1838" name="__module.model.layers.11.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2157"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1839" name="__module.model.layers.11.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1840" name="__module.model.layers.11.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2158"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1841" name="__module.model.layers.11.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2159,2160,hidden_states.333,hidden_states.335"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1842" name="__module.model.layers.11.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2161,2163,hidden_states.337"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1843" name="self.model.layers.11.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="3017761552" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1844" name="Convert_1229762" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1845" name="self.model.layers.11.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3027198736" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1846" name="Convert_1229765" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1847" name="self.model.layers.11.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1848" name="self.model.layers.11.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3027201808" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1849" name="self.model.layers.11.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1850" name="__module.model.layers.11.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1851" name="__module.model.layers.11.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2172,query_states.23"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1852" name="Constant_1187772" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1853" name="__module.model.layers.11.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2178"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1854" name="__module.model.layers.11.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1855" name="__module.model.layers.11.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2179,q.23"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1856" name="__module.model.layers.11.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2188"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1857" name="Constant_1095644" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1858" name="Constant_1095646" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1859" name="Constant_1095648" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1860" name="__module.model.layers.11.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2198,x2.45"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1861" name="Constant_1175946" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1862" name="__module.model.layers.11.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2199"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1863" name="Constant_1095541" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1864" name="Constant_1095585" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1865" name="Constant_1095587" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1866" name="__module.model.layers.11.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2193"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1867" name="__module.model.layers.11.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2201"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1868" name="__module.model.layers.11.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2202"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1869" name="__module.model.layers.11.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2203"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1870" name="ReadValue_1190072" type="ReadValue" version="opset6"> <data variable_id="past_key_values.11.keypresent.11.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.11.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1871" name="Constant_1189441" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1872" name="Gather_1189442" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1873" name="self.model.layers.11.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="3027207952" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1874" name="Convert_1230572" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1875" name="self.model.layers.11.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="3030353680" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1876" name="Convert_1230575" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1877" name="self.model.layers.11.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1878" name="self.model.layers.11.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="3030354704" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1879" name="self.model.layers.11.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1880" name="__module.model.layers.11.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1881" name="__module.model.layers.11.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2174,key_states.49"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1882" name="Constant_1187773" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1883" name="__module.model.layers.11.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2181"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1884" name="__module.model.layers.11.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1885" name="__module.model.layers.11.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2182,k.23"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1886" name="__module.model.layers.11.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2204"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1887" name="Constant_1095787" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1888" name="Constant_1095789" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1889" name="Constant_1095791" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1890" name="__module.model.layers.11.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2214,x2.47"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1891" name="Constant_1175947" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1892" name="__module.model.layers.11.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2215"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1893" name="Constant_1095684" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1894" name="Constant_1095728" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1895" name="Constant_1095730" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1896" name="__module.model.layers.11.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2209"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="1897" name="__module.model.layers.11.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2217"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1898" name="__module.model.layers.11.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2218"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1899" name="__module.model.layers.11.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2219"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1900" name="__module.model.layers.11.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2229,2230,hidden_states.339,present.11.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1901" name="__module.model.layers.11.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2231,2232,2233"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1902" name="__module.model.layers.11.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2235,hidden_states.341"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1903" name="Constant_1187774" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1904" name="__module.model.layers.11.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2239,key_states.51"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1905" name="ReadValue_1190074" type="ReadValue" version="opset6"> <data variable_id="past_key_values.11.valuepresent.11.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.11.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1906" name="Constant_1189444" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1907" name="Gather_1189445" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1908" name="self.model.layers.11.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="3030356752" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1909" name="Convert_1230562" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1910" name="self.model.layers.11.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="3033502480" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1911" name="Convert_1230565" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1912" name="self.model.layers.11.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1913" name="self.model.layers.11.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="3033503504" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="1914" name="self.model.layers.11.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1915" name="__module.model.layers.11.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1916" name="__module.model.layers.11.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2176,value_states.23"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1917" name="Constant_1187775" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1918" name="__module.model.layers.11.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2184"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="1919" name="__module.model.layers.11.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1920" name="__module.model.layers.11.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2185"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1921" name="__module.model.layers.11.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2245,2246,hidden_states.343,present.11.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1922" name="__module.model.layers.11.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2247,2248,2249"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1923" name="__module.model.layers.11.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2251,hidden_states.345"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1924" name="Constant_1187776" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1925" name="__module.model.layers.11.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2255"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1926" name="__module.model.layers.11.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2261,attn_output.45"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1927" name="__module.model.layers.11.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1928" name="__module.model.layers.11.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2262"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="1929" name="__module.model.layers.11.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2265"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1930" name="self.model.layers.11.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="3033505552" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1931" name="Convert_1229772" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1932" name="self.model.layers.11.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3042942736" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1933" name="Convert_1229775" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1934" name="self.model.layers.11.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1935" name="self.model.layers.11.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3042945808" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1936" name="self.model.layers.11.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1937" name="__module.model.layers.11.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1938" name="__module.model.layers.11.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2267,2269,hidden_states.347"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1939" name="__module.model.layers.11/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2272,2274,2285,hidden_states.349,hidden_states.351"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1940" name="Constant_1175951" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="3042951952" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1941" name="Constant_1175950" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1942" name="Constant_1175948" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1943" name="__module.model.layers.11.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2275"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1944" name="Constant_1096390" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2276"> <dim>1</dim> </port> </output> </layer> <layer id="1945" name="__module.model.layers.11.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2277,variance.47"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1946" name="Constant_1175949" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1947" name="__module.model.layers.11.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2278"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1948" name="__module.model.layers.11.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1949" name="__module.model.layers.11.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2279"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1950" name="__module.model.layers.11.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2280,2281,hidden_states.353,hidden_states.355"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1951" name="__module.model.layers.11.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2282,2284"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1952" name="self.model.layers.11.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="3042964240" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1953" name="Convert_1228682" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1954" name="self.model.layers.11.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="3113743120" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1955" name="Convert_1228685" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1956" name="self.model.layers.11.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1957" name="self.model.layers.11.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="3113766160" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1958" name="self.model.layers.11.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1959" name="__module.model.layers.11.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1960" name="__module.model.layers.11.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2290,input.23"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1961" name="__module.model.layers.11.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="2291"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1962" name="self.model.layers.11.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="3113812240" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1963" name="Convert_1228672" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1964" name="self.model.layers.11.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="3184591120" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1965" name="Convert_1228675" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1966" name="self.model.layers.11.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1967" name="self.model.layers.11.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="3184614160" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="1968" name="self.model.layers.11.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1969" name="__module.model.layers.11.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1970" name="__module.model.layers.11.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2293"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1971" name="__module.model.layers.11.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2294"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1972" name="self.model.layers.11.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="3184660240" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1973" name="Convert_1228692" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1974" name="self.model.layers.11.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3255439120" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1975" name="Convert_1228695" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1976" name="self.model.layers.11.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1977" name="self.model.layers.11.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3255442192" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1978" name="self.model.layers.11.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1979" name="__module.model.layers.11.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="1980" name="__module.model.layers.11.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2296,hidden_states.357"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1981" name="__module.model.layers.11/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2297,2299,2307,2318,hidden_states.359,hidden_states.361"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1982" name="Constant_1175955" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="3255448336" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1983" name="Constant_1175954" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1984" name="Constant_1175952" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1985" name="__module.model.layers.12.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2308"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1986" name="Constant_1096464" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2309"> <dim>1</dim> </port> </output> </layer> <layer id="1987" name="__module.model.layers.12.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2310,variance.49"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1988" name="Constant_1175953" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1989" name="__module.model.layers.12.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2311"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1990" name="__module.model.layers.12.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1991" name="__module.model.layers.12.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2312"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1992" name="__module.model.layers.12.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2313,2314,hidden_states.363,hidden_states.365"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1993" name="__module.model.layers.12.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2315,2317,hidden_states.367"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1994" name="self.model.layers.12.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="3255460624" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1995" name="Convert_1229782" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1996" name="self.model.layers.12.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3264897808" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1997" name="Convert_1229785" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="1998" name="self.model.layers.12.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1999" name="self.model.layers.12.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3264900880" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2000" name="self.model.layers.12.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2001" name="__module.model.layers.12.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2002" name="__module.model.layers.12.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2326,query_states.25"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2003" name="Constant_1187777" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2004" name="__module.model.layers.12.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2332"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2005" name="__module.model.layers.12.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2006" name="__module.model.layers.12.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2333,q.25"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2007" name="__module.model.layers.12.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2342"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2008" name="Constant_1096861" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2009" name="Constant_1096863" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2010" name="Constant_1096865" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2011" name="__module.model.layers.12.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2352,x2.49"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2012" name="Constant_1175956" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2013" name="__module.model.layers.12.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2353"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2014" name="Constant_1096758" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2015" name="Constant_1096802" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2016" name="Constant_1096804" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2017" name="__module.model.layers.12.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2347"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2018" name="__module.model.layers.12.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2355"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2019" name="__module.model.layers.12.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2356"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2020" name="__module.model.layers.12.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2357"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2021" name="ReadValue_1190076" type="ReadValue" version="opset6"> <data variable_id="past_key_values.12.keypresent.12.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.12.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2022" name="Constant_1189447" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2023" name="Gather_1189448" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2024" name="self.model.layers.12.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="3264907024" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2025" name="Convert_1230592" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2026" name="self.model.layers.12.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="3268052752" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2027" name="Convert_1230595" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2028" name="self.model.layers.12.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2029" name="self.model.layers.12.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="3268053776" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2030" name="self.model.layers.12.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2031" name="__module.model.layers.12.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2032" name="__module.model.layers.12.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2328,key_states.53"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2033" name="Constant_1187778" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2034" name="__module.model.layers.12.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2335"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2035" name="__module.model.layers.12.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2036" name="__module.model.layers.12.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2336,k.25"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2037" name="__module.model.layers.12.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2358"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2038" name="Constant_1097004" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2039" name="Constant_1097006" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2040" name="Constant_1097008" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2041" name="__module.model.layers.12.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2368,x2.51"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2042" name="Constant_1175957" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2043" name="__module.model.layers.12.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2369"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2044" name="Constant_1096901" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2045" name="Constant_1096945" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2046" name="Constant_1096947" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2047" name="__module.model.layers.12.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2363"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2048" name="__module.model.layers.12.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2371"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2049" name="__module.model.layers.12.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2372"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2050" name="__module.model.layers.12.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2373"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2051" name="__module.model.layers.12.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2383,2384,hidden_states.369,present.12.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2052" name="__module.model.layers.12.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2385,2386,2387"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2053" name="__module.model.layers.12.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2389,hidden_states.371"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2054" name="Constant_1187779" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2055" name="__module.model.layers.12.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2393,key_states.55"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2056" name="ReadValue_1190078" type="ReadValue" version="opset6"> <data variable_id="past_key_values.12.valuepresent.12.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.12.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2057" name="Constant_1189450" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2058" name="Gather_1189451" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2059" name="self.model.layers.12.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="3268055824" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2060" name="Convert_1230582" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2061" name="self.model.layers.12.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="3271201552" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2062" name="Convert_1230585" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2063" name="self.model.layers.12.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2064" name="self.model.layers.12.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="3271202576" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2065" name="self.model.layers.12.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2066" name="__module.model.layers.12.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2067" name="__module.model.layers.12.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2330,value_states.25"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2068" name="Constant_1187780" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2069" name="__module.model.layers.12.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2338"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2070" name="__module.model.layers.12.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2071" name="__module.model.layers.12.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2339"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2072" name="__module.model.layers.12.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2399,2400,hidden_states.373,present.12.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2073" name="__module.model.layers.12.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2401,2402,2403"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2074" name="__module.model.layers.12.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2405,hidden_states.375"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2075" name="Constant_1187781" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2076" name="__module.model.layers.12.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2409"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2077" name="__module.model.layers.12.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2415,attn_output.49"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2078" name="__module.model.layers.12.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2079" name="__module.model.layers.12.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2416"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2080" name="__module.model.layers.12.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2419"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="2081" name="self.model.layers.12.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="3271204624" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2082" name="Convert_1229792" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2083" name="self.model.layers.12.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3280641808" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2084" name="Convert_1229795" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2085" name="self.model.layers.12.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2086" name="self.model.layers.12.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3280644880" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2087" name="self.model.layers.12.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2088" name="__module.model.layers.12.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2089" name="__module.model.layers.12.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2421,2423,hidden_states.377"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2090" name="__module.model.layers.12/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2426,2428,2439,hidden_states.379,hidden_states.381"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2091" name="Constant_1175961" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="3280651024" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2092" name="Constant_1175960" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2093" name="Constant_1175958" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2094" name="__module.model.layers.12.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2429"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2095" name="Constant_1097607" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2430"> <dim>1</dim> </port> </output> </layer> <layer id="2096" name="__module.model.layers.12.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2431,variance.51"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2097" name="Constant_1175959" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2098" name="__module.model.layers.12.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2432"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2099" name="__module.model.layers.12.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2100" name="__module.model.layers.12.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2433"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2101" name="__module.model.layers.12.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2434,2435,hidden_states.383,hidden_states.385"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2102" name="__module.model.layers.12.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2436,2438"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2103" name="self.model.layers.12.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="3280663312" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2104" name="Convert_1228712" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2105" name="self.model.layers.12.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="3351442192" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2106" name="Convert_1228715" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2107" name="self.model.layers.12.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2108" name="self.model.layers.12.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="3351465232" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2109" name="self.model.layers.12.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2110" name="__module.model.layers.12.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2111" name="__module.model.layers.12.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2444,input.25"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2112" name="__module.model.layers.12.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="2445"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2113" name="self.model.layers.12.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="3351511312" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2114" name="Convert_1228702" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2115" name="self.model.layers.12.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="3422290192" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2116" name="Convert_1228705" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2117" name="self.model.layers.12.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2118" name="self.model.layers.12.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="3422313232" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2119" name="self.model.layers.12.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2120" name="__module.model.layers.12.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2121" name="__module.model.layers.12.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2447"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2122" name="__module.model.layers.12.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2448"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2123" name="self.model.layers.12.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="3422359312" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2124" name="Convert_1228722" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2125" name="self.model.layers.12.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3493138192" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2126" name="Convert_1228725" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2127" name="self.model.layers.12.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2128" name="self.model.layers.12.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3493141264" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2129" name="self.model.layers.12.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2130" name="__module.model.layers.12.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2131" name="__module.model.layers.12.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2450,hidden_states.387"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2132" name="__module.model.layers.12/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2451,2453,2461,2472,hidden_states.389,hidden_states.391"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2133" name="Constant_1175965" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="3493147408" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2134" name="Constant_1175964" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2135" name="Constant_1175962" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2136" name="__module.model.layers.13.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2462"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2137" name="Constant_1097681" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2463"> <dim>1</dim> </port> </output> </layer> <layer id="2138" name="__module.model.layers.13.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2464,variance.53"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2139" name="Constant_1175963" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2140" name="__module.model.layers.13.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2465"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2141" name="__module.model.layers.13.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2142" name="__module.model.layers.13.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2466"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2143" name="__module.model.layers.13.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2467,2468,hidden_states.393,hidden_states.395"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2144" name="__module.model.layers.13.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2469,2471,hidden_states.397"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2145" name="self.model.layers.13.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="3493159696" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2146" name="Convert_1229802" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2147" name="self.model.layers.13.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3502596880" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2148" name="Convert_1229805" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2149" name="self.model.layers.13.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2150" name="self.model.layers.13.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3502599952" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2151" name="self.model.layers.13.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2152" name="__module.model.layers.13.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2153" name="__module.model.layers.13.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2480,query_states.27"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2154" name="Constant_1187782" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2155" name="__module.model.layers.13.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2486"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2156" name="__module.model.layers.13.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2157" name="__module.model.layers.13.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2487,q.27"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2158" name="__module.model.layers.13.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2496"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2159" name="Constant_1098078" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2160" name="Constant_1098080" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2161" name="Constant_1098082" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2162" name="__module.model.layers.13.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2506,x2.53"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2163" name="Constant_1175966" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2164" name="__module.model.layers.13.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2507"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2165" name="Constant_1097975" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2166" name="Constant_1098019" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2167" name="Constant_1098021" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2168" name="__module.model.layers.13.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2501"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2169" name="__module.model.layers.13.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2509"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2170" name="__module.model.layers.13.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2510"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2171" name="__module.model.layers.13.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2511"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2172" name="ReadValue_1190080" type="ReadValue" version="opset6"> <data variable_id="past_key_values.13.keypresent.13.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.13.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2173" name="Constant_1189453" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2174" name="Gather_1189454" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2175" name="self.model.layers.13.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="3502606096" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2176" name="Convert_1230612" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2177" name="self.model.layers.13.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="3505751824" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2178" name="Convert_1230615" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2179" name="self.model.layers.13.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2180" name="self.model.layers.13.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="3505752848" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2181" name="self.model.layers.13.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2182" name="__module.model.layers.13.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2183" name="__module.model.layers.13.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2482,key_states.57"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2184" name="Constant_1187783" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2185" name="__module.model.layers.13.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2489"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2186" name="__module.model.layers.13.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2187" name="__module.model.layers.13.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2490,k.27"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2188" name="__module.model.layers.13.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2512"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2189" name="Constant_1098221" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2190" name="Constant_1098223" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2191" name="Constant_1098225" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2192" name="__module.model.layers.13.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2522,x2.55"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2193" name="Constant_1175967" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2194" name="__module.model.layers.13.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2523"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2195" name="Constant_1098118" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2196" name="Constant_1098162" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2197" name="Constant_1098164" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2198" name="__module.model.layers.13.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2517"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2199" name="__module.model.layers.13.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2525"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2200" name="__module.model.layers.13.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2526"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2201" name="__module.model.layers.13.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2527"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2202" name="__module.model.layers.13.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2537,2538,hidden_states.399,present.13.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2203" name="__module.model.layers.13.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2539,2540,2541"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2204" name="__module.model.layers.13.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2543,hidden_states.401"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2205" name="Constant_1187784" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2206" name="__module.model.layers.13.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2547,key_states.59"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2207" name="ReadValue_1190082" type="ReadValue" version="opset6"> <data variable_id="past_key_values.13.valuepresent.13.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.13.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2208" name="Constant_1189456" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2209" name="Gather_1189457" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2210" name="self.model.layers.13.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="3505754896" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2211" name="Convert_1230602" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2212" name="self.model.layers.13.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="3508900624" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2213" name="Convert_1230605" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2214" name="self.model.layers.13.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2215" name="self.model.layers.13.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="3508901648" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2216" name="self.model.layers.13.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2217" name="__module.model.layers.13.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2218" name="__module.model.layers.13.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2484,value_states.27"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2219" name="Constant_1187785" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2220" name="__module.model.layers.13.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2492"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2221" name="__module.model.layers.13.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2222" name="__module.model.layers.13.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2493"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2223" name="__module.model.layers.13.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2553,2554,hidden_states.403,present.13.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2224" name="__module.model.layers.13.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2555,2556,2557"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2225" name="__module.model.layers.13.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2559,hidden_states.405"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2226" name="Constant_1187786" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2227" name="__module.model.layers.13.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2563"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2228" name="__module.model.layers.13.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2569,attn_output.53"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2229" name="__module.model.layers.13.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2230" name="__module.model.layers.13.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2570"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2231" name="__module.model.layers.13.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2573"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="2232" name="self.model.layers.13.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="3508903696" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2233" name="Convert_1229812" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2234" name="self.model.layers.13.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3518340880" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2235" name="Convert_1229815" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2236" name="self.model.layers.13.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2237" name="self.model.layers.13.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3518343952" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2238" name="self.model.layers.13.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2239" name="__module.model.layers.13.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2240" name="__module.model.layers.13.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2575,2577,hidden_states.407"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2241" name="__module.model.layers.13/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2580,2582,2593,hidden_states.409,hidden_states.411"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2242" name="Constant_1175971" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="3518350096" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2243" name="Constant_1175970" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2244" name="Constant_1175968" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2245" name="__module.model.layers.13.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2583"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2246" name="Constant_1098824" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2584"> <dim>1</dim> </port> </output> </layer> <layer id="2247" name="__module.model.layers.13.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2585,variance.55"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2248" name="Constant_1175969" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2249" name="__module.model.layers.13.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2586"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2250" name="__module.model.layers.13.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2251" name="__module.model.layers.13.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2587"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2252" name="__module.model.layers.13.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2588,2589,hidden_states.413,hidden_states.415"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2253" name="__module.model.layers.13.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2590,2592"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2254" name="self.model.layers.13.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="3518362384" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2255" name="Convert_1228742" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2256" name="self.model.layers.13.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="3589141264" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2257" name="Convert_1228745" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2258" name="self.model.layers.13.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2259" name="self.model.layers.13.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="3589164304" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2260" name="self.model.layers.13.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2261" name="__module.model.layers.13.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2262" name="__module.model.layers.13.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2598,input.27"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2263" name="__module.model.layers.13.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="2599"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2264" name="self.model.layers.13.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="3589210384" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2265" name="Convert_1228732" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2266" name="self.model.layers.13.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="3659989264" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2267" name="Convert_1228735" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2268" name="self.model.layers.13.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2269" name="self.model.layers.13.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="3660012304" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2270" name="self.model.layers.13.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2271" name="__module.model.layers.13.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2272" name="__module.model.layers.13.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2601"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2273" name="__module.model.layers.13.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2602"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2274" name="self.model.layers.13.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="3660058384" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2275" name="Convert_1228752" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2276" name="self.model.layers.13.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3730837264" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2277" name="Convert_1228755" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2278" name="self.model.layers.13.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2279" name="self.model.layers.13.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3730840336" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2280" name="self.model.layers.13.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2281" name="__module.model.layers.13.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2282" name="__module.model.layers.13.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2604,hidden_states.417"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2283" name="__module.model.layers.13/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2605,2607,2615,2626,hidden_states.419,hidden_states.421"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2284" name="Constant_1175975" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="3730846480" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2285" name="Constant_1175974" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2286" name="Constant_1175972" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2287" name="__module.model.layers.14.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2616"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2288" name="Constant_1098898" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2617"> <dim>1</dim> </port> </output> </layer> <layer id="2289" name="__module.model.layers.14.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2618,variance.57"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2290" name="Constant_1175973" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2291" name="__module.model.layers.14.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2619"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2292" name="__module.model.layers.14.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2293" name="__module.model.layers.14.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2620"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2294" name="__module.model.layers.14.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2621,2622,hidden_states.423,hidden_states.425"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2295" name="__module.model.layers.14.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2623,2625,hidden_states.427"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2296" name="self.model.layers.14.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="3730858768" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2297" name="Convert_1229822" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2298" name="self.model.layers.14.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3740295952" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2299" name="Convert_1229825" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2300" name="self.model.layers.14.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2301" name="self.model.layers.14.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3740299024" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2302" name="self.model.layers.14.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2303" name="__module.model.layers.14.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2304" name="__module.model.layers.14.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2634,query_states.29"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2305" name="Constant_1187787" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2306" name="__module.model.layers.14.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2640"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2307" name="__module.model.layers.14.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2308" name="__module.model.layers.14.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2641,q.29"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2309" name="__module.model.layers.14.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2650"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2310" name="Constant_1099295" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2311" name="Constant_1099297" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2312" name="Constant_1099299" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2313" name="__module.model.layers.14.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2660,x2.57"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2314" name="Constant_1175976" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2315" name="__module.model.layers.14.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2661"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2316" name="Constant_1099192" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2317" name="Constant_1099236" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2318" name="Constant_1099238" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2319" name="__module.model.layers.14.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2655"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2320" name="__module.model.layers.14.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2663"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2321" name="__module.model.layers.14.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2664"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2322" name="__module.model.layers.14.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2665"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2323" name="ReadValue_1190084" type="ReadValue" version="opset6"> <data variable_id="past_key_values.14.keypresent.14.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.14.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2324" name="Constant_1189459" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2325" name="Gather_1189460" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2326" name="self.model.layers.14.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="3740305168" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2327" name="Convert_1230632" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2328" name="self.model.layers.14.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="3743450896" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2329" name="Convert_1230635" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2330" name="self.model.layers.14.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2331" name="self.model.layers.14.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="3743451920" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2332" name="self.model.layers.14.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2333" name="__module.model.layers.14.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2334" name="__module.model.layers.14.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2636,key_states.61"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2335" name="Constant_1187788" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2336" name="__module.model.layers.14.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2643"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2337" name="__module.model.layers.14.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2338" name="__module.model.layers.14.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2644,k.29"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2339" name="__module.model.layers.14.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2666"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2340" name="Constant_1099438" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2341" name="Constant_1099440" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2342" name="Constant_1099442" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2343" name="__module.model.layers.14.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2676,x2.59"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2344" name="Constant_1175977" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2345" name="__module.model.layers.14.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2677"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2346" name="Constant_1099335" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2347" name="Constant_1099379" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2348" name="Constant_1099381" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2349" name="__module.model.layers.14.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2671"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2350" name="__module.model.layers.14.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2679"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2351" name="__module.model.layers.14.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2680"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2352" name="__module.model.layers.14.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2681"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2353" name="__module.model.layers.14.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2691,2692,hidden_states.429,present.14.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2354" name="__module.model.layers.14.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2693,2694,2695"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2355" name="__module.model.layers.14.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2697,hidden_states.431"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2356" name="Constant_1187789" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2357" name="__module.model.layers.14.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2701,key_states.63"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2358" name="ReadValue_1190086" type="ReadValue" version="opset6"> <data variable_id="past_key_values.14.valuepresent.14.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.14.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2359" name="Constant_1189462" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2360" name="Gather_1189463" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2361" name="self.model.layers.14.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="3743453968" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2362" name="Convert_1230622" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2363" name="self.model.layers.14.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="3746599696" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2364" name="Convert_1230625" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2365" name="self.model.layers.14.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2366" name="self.model.layers.14.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="3746600720" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2367" name="self.model.layers.14.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2368" name="__module.model.layers.14.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2369" name="__module.model.layers.14.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2638,value_states.29"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2370" name="Constant_1187790" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2371" name="__module.model.layers.14.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2646"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2372" name="__module.model.layers.14.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2373" name="__module.model.layers.14.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2647"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2374" name="__module.model.layers.14.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2707,2708,hidden_states.433,present.14.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2375" name="__module.model.layers.14.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2709,2710,2711"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2376" name="__module.model.layers.14.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2713,hidden_states.435"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2377" name="Constant_1187791" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2378" name="__module.model.layers.14.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2717"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2379" name="__module.model.layers.14.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2723,attn_output.57"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2380" name="__module.model.layers.14.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2381" name="__module.model.layers.14.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2724"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2382" name="__module.model.layers.14.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2727"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="2383" name="self.model.layers.14.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="3746602768" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2384" name="Convert_1229832" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2385" name="self.model.layers.14.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3756039952" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2386" name="Convert_1229835" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2387" name="self.model.layers.14.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2388" name="self.model.layers.14.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3756043024" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2389" name="self.model.layers.14.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2390" name="__module.model.layers.14.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2391" name="__module.model.layers.14.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2729,2731,hidden_states.437"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2392" name="__module.model.layers.14/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2734,2736,2747,hidden_states.439,hidden_states.441"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2393" name="Constant_1175981" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="3756049168" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2394" name="Constant_1175980" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2395" name="Constant_1175978" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2396" name="__module.model.layers.14.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2737"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2397" name="Constant_1100041" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2738"> <dim>1</dim> </port> </output> </layer> <layer id="2398" name="__module.model.layers.14.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2739,variance.59"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2399" name="Constant_1175979" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2400" name="__module.model.layers.14.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2740"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2401" name="__module.model.layers.14.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2402" name="__module.model.layers.14.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2741"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2403" name="__module.model.layers.14.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2742,2743,hidden_states.443,hidden_states.445"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2404" name="__module.model.layers.14.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2744,2746"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2405" name="self.model.layers.14.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="3756061456" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2406" name="Convert_1228772" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2407" name="self.model.layers.14.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="3826840336" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2408" name="Convert_1228775" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2409" name="self.model.layers.14.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2410" name="self.model.layers.14.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="3826863376" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2411" name="self.model.layers.14.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2412" name="__module.model.layers.14.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2413" name="__module.model.layers.14.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2752,input.29"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2414" name="__module.model.layers.14.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="2753"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2415" name="self.model.layers.14.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="3826909456" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2416" name="Convert_1228762" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2417" name="self.model.layers.14.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="3897688336" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2418" name="Convert_1228765" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2419" name="self.model.layers.14.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2420" name="self.model.layers.14.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="3897711376" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2421" name="self.model.layers.14.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2422" name="__module.model.layers.14.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2423" name="__module.model.layers.14.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2755"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2424" name="__module.model.layers.14.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2756"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2425" name="self.model.layers.14.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="3897757456" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2426" name="Convert_1228782" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2427" name="self.model.layers.14.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3968536336" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2428" name="Convert_1228785" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2429" name="self.model.layers.14.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2430" name="self.model.layers.14.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3968539408" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2431" name="self.model.layers.14.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2432" name="__module.model.layers.14.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2433" name="__module.model.layers.14.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2758,hidden_states.447"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2434" name="__module.model.layers.14/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2759,2761,2769,2780,hidden_states.449,hidden_states.451"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2435" name="Constant_1175985" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="3968545552" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2436" name="Constant_1175984" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2437" name="Constant_1175982" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2438" name="__module.model.layers.15.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2770"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2439" name="Constant_1100115" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2771"> <dim>1</dim> </port> </output> </layer> <layer id="2440" name="__module.model.layers.15.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2772,variance.61"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2441" name="Constant_1175983" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2442" name="__module.model.layers.15.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2773"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2443" name="__module.model.layers.15.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2444" name="__module.model.layers.15.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2774"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2445" name="__module.model.layers.15.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2775,2776,hidden_states.453,hidden_states.455"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2446" name="__module.model.layers.15.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2777,2779,hidden_states.457"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2447" name="self.model.layers.15.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="3968557840" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2448" name="Convert_1229842" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2449" name="self.model.layers.15.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3977995024" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2450" name="Convert_1229845" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2451" name="self.model.layers.15.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2452" name="self.model.layers.15.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3977998096" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2453" name="self.model.layers.15.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2454" name="__module.model.layers.15.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2455" name="__module.model.layers.15.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2788,query_states.31"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2456" name="Constant_1187792" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2457" name="__module.model.layers.15.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2794"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2458" name="__module.model.layers.15.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2459" name="__module.model.layers.15.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2795,q.31"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2460" name="__module.model.layers.15.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2804"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2461" name="Constant_1100512" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2462" name="Constant_1100514" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2463" name="Constant_1100516" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2464" name="__module.model.layers.15.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2814,x2.61"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2465" name="Constant_1175986" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2466" name="__module.model.layers.15.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2815"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2467" name="Constant_1100409" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2468" name="Constant_1100453" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2469" name="Constant_1100455" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2470" name="__module.model.layers.15.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2809"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2471" name="__module.model.layers.15.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2817"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2472" name="__module.model.layers.15.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2818"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2473" name="__module.model.layers.15.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2819"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2474" name="ReadValue_1190088" type="ReadValue" version="opset6"> <data variable_id="past_key_values.15.keypresent.15.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.15.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2475" name="Constant_1189465" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2476" name="Gather_1189466" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2477" name="self.model.layers.15.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="3978004240" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2478" name="Convert_1230652" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2479" name="self.model.layers.15.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="3981149968" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2480" name="Convert_1230655" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2481" name="self.model.layers.15.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2482" name="self.model.layers.15.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="3981150992" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2483" name="self.model.layers.15.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2484" name="__module.model.layers.15.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2485" name="__module.model.layers.15.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2790,key_states.65"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2486" name="Constant_1187793" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2487" name="__module.model.layers.15.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2797"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2488" name="__module.model.layers.15.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2489" name="__module.model.layers.15.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2798,k.31"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2490" name="__module.model.layers.15.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2820"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2491" name="Constant_1100655" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2492" name="Constant_1100657" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2493" name="Constant_1100659" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2494" name="__module.model.layers.15.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2830,x2.63"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2495" name="Constant_1175987" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2496" name="__module.model.layers.15.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2831"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2497" name="Constant_1100552" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2498" name="Constant_1100596" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2499" name="Constant_1100598" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2500" name="__module.model.layers.15.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2825"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2501" name="__module.model.layers.15.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2833"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2502" name="__module.model.layers.15.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2834"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2503" name="__module.model.layers.15.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2835"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2504" name="__module.model.layers.15.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2845,2846,hidden_states.459,present.15.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2505" name="__module.model.layers.15.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2847,2848,2849"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2506" name="__module.model.layers.15.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2851,hidden_states.461"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2507" name="Constant_1187794" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2508" name="__module.model.layers.15.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2855,key_states.67"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2509" name="ReadValue_1190090" type="ReadValue" version="opset6"> <data variable_id="past_key_values.15.valuepresent.15.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.15.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2510" name="Constant_1189468" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2511" name="Gather_1189469" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2512" name="self.model.layers.15.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="3981153040" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2513" name="Convert_1230642" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2514" name="self.model.layers.15.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="3984298768" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2515" name="Convert_1230645" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2516" name="self.model.layers.15.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2517" name="self.model.layers.15.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="3984299792" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2518" name="self.model.layers.15.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2519" name="__module.model.layers.15.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2520" name="__module.model.layers.15.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2792,value_states.31"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2521" name="Constant_1187795" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2522" name="__module.model.layers.15.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2800"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2523" name="__module.model.layers.15.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2524" name="__module.model.layers.15.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2801"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2525" name="__module.model.layers.15.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2861,2862,hidden_states.463,present.15.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2526" name="__module.model.layers.15.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="2863,2864,2865"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2527" name="__module.model.layers.15.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="2867,hidden_states.465"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2528" name="Constant_1187796" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2529" name="__module.model.layers.15.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2871"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2530" name="__module.model.layers.15.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2877,attn_output.61"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2531" name="__module.model.layers.15.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2532" name="__module.model.layers.15.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2878"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2533" name="__module.model.layers.15.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2881"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="2534" name="self.model.layers.15.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="3984301840" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2535" name="Convert_1229852" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2536" name="self.model.layers.15.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="3993739024" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2537" name="Convert_1229855" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2538" name="self.model.layers.15.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2539" name="self.model.layers.15.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="3993742096" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2540" name="self.model.layers.15.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2541" name="__module.model.layers.15.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2542" name="__module.model.layers.15.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2883,2885,hidden_states.467"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2543" name="__module.model.layers.15/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2888,2890,2901,hidden_states.469,hidden_states.471"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2544" name="Constant_1175991" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="3993748240" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2545" name="Constant_1175990" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2546" name="Constant_1175988" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2547" name="__module.model.layers.15.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2891"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2548" name="Constant_1101258" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2892"> <dim>1</dim> </port> </output> </layer> <layer id="2549" name="__module.model.layers.15.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2893,variance.63"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2550" name="Constant_1175989" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2551" name="__module.model.layers.15.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2894"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2552" name="__module.model.layers.15.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2553" name="__module.model.layers.15.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2895"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2554" name="__module.model.layers.15.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2896,2897,hidden_states.473,hidden_states.475"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2555" name="__module.model.layers.15.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2898,2900"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2556" name="self.model.layers.15.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="3993760528" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2557" name="Convert_1228802" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2558" name="self.model.layers.15.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="4064539408" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2559" name="Convert_1228805" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2560" name="self.model.layers.15.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2561" name="self.model.layers.15.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="4064562448" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2562" name="self.model.layers.15.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2563" name="__module.model.layers.15.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2564" name="__module.model.layers.15.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2906,input.31"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2565" name="__module.model.layers.15.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="2907"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2566" name="self.model.layers.15.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="4064608528" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2567" name="Convert_1228792" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2568" name="self.model.layers.15.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="4135387408" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2569" name="Convert_1228795" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2570" name="self.model.layers.15.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2571" name="self.model.layers.15.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="4135410448" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2572" name="self.model.layers.15.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2573" name="__module.model.layers.15.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2574" name="__module.model.layers.15.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2909"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2575" name="__module.model.layers.15.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2910"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2576" name="self.model.layers.15.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="4135456528" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2577" name="Convert_1228812" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2578" name="self.model.layers.15.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4206235408" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2579" name="Convert_1228815" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2580" name="self.model.layers.15.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2581" name="self.model.layers.15.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4206238480" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2582" name="self.model.layers.15.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2583" name="__module.model.layers.15.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2584" name="__module.model.layers.15.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="2912,hidden_states.477"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2585" name="__module.model.layers.15/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2913,2915,2923,2934,hidden_states.479,hidden_states.481"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2586" name="Constant_1175995" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="4206244624" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2587" name="Constant_1175994" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2588" name="Constant_1175992" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2589" name="__module.model.layers.16.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2924"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2590" name="Constant_1101332" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="2925"> <dim>1</dim> </port> </output> </layer> <layer id="2591" name="__module.model.layers.16.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2926,variance.65"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2592" name="Constant_1175993" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2593" name="__module.model.layers.16.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2927"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2594" name="__module.model.layers.16.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2595" name="__module.model.layers.16.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2928"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2596" name="__module.model.layers.16.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2929,2930,hidden_states.483,hidden_states.485"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2597" name="__module.model.layers.16.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2931,2933,hidden_states.487"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2598" name="self.model.layers.16.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="4206256912" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2599" name="Convert_1229862" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2600" name="self.model.layers.16.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4215694096" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2601" name="Convert_1229865" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2602" name="self.model.layers.16.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2603" name="self.model.layers.16.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4215697168" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2604" name="self.model.layers.16.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2605" name="__module.model.layers.16.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2606" name="__module.model.layers.16.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2942,query_states.33"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2607" name="Constant_1187797" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2608" name="__module.model.layers.16.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2948"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2609" name="__module.model.layers.16.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2610" name="__module.model.layers.16.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2949,q.33"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2611" name="__module.model.layers.16.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2958"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2612" name="Constant_1101729" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2613" name="Constant_1101731" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2614" name="Constant_1101733" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2615" name="__module.model.layers.16.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2968,x2.65"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2616" name="Constant_1175996" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2617" name="__module.model.layers.16.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2969"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2618" name="Constant_1101626" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2619" name="Constant_1101670" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2620" name="Constant_1101672" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2621" name="__module.model.layers.16.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2963"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2622" name="__module.model.layers.16.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2971"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2623" name="__module.model.layers.16.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2972"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2624" name="__module.model.layers.16.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2973"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2625" name="ReadValue_1190092" type="ReadValue" version="opset6"> <data variable_id="past_key_values.16.keypresent.16.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.16.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2626" name="Constant_1189471" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2627" name="Gather_1189472" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2628" name="self.model.layers.16.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="4215703312" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2629" name="Convert_1230672" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2630" name="self.model.layers.16.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="4218849040" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2631" name="Convert_1230675" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2632" name="self.model.layers.16.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2633" name="self.model.layers.16.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="4218850064" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2634" name="self.model.layers.16.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2635" name="__module.model.layers.16.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2636" name="__module.model.layers.16.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2944,key_states.69"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2637" name="Constant_1187798" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2638" name="__module.model.layers.16.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2951"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2639" name="__module.model.layers.16.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2640" name="__module.model.layers.16.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2952,k.33"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2641" name="__module.model.layers.16.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2974"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2642" name="Constant_1101872" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2643" name="Constant_1101874" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2644" name="Constant_1101876" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2645" name="__module.model.layers.16.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2984,x2.67"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2646" name="Constant_1175997" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2647" name="__module.model.layers.16.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2985"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2648" name="Constant_1101769" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2649" name="Constant_1101813" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2650" name="Constant_1101815" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2651" name="__module.model.layers.16.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2979"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2652" name="__module.model.layers.16.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="2987"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2653" name="__module.model.layers.16.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2988"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2654" name="__module.model.layers.16.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2989"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2655" name="__module.model.layers.16.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="2999,3000,hidden_states.489,present.16.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2656" name="__module.model.layers.16.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3001,3002,3003"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2657" name="__module.model.layers.16.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3005,hidden_states.491"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2658" name="Constant_1187799" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2659" name="__module.model.layers.16.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3009,key_states.71"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2660" name="ReadValue_1190094" type="ReadValue" version="opset6"> <data variable_id="past_key_values.16.valuepresent.16.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.16.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2661" name="Constant_1189474" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2662" name="Gather_1189475" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2663" name="self.model.layers.16.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="4218852112" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2664" name="Convert_1230662" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2665" name="self.model.layers.16.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="4221997840" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2666" name="Convert_1230665" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2667" name="self.model.layers.16.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2668" name="self.model.layers.16.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="4221998864" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2669" name="self.model.layers.16.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2670" name="__module.model.layers.16.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2671" name="__module.model.layers.16.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2946,value_states.33"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2672" name="Constant_1187800" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2673" name="__module.model.layers.16.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2954"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2674" name="__module.model.layers.16.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2675" name="__module.model.layers.16.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2955"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2676" name="__module.model.layers.16.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3015,3016,hidden_states.493,present.16.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2677" name="__module.model.layers.16.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3017,3018,3019"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2678" name="__module.model.layers.16.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3021,hidden_states.495"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2679" name="Constant_1187801" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2680" name="__module.model.layers.16.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3025"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2681" name="__module.model.layers.16.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3031,attn_output.65"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2682" name="__module.model.layers.16.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2683" name="__module.model.layers.16.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3032"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2684" name="__module.model.layers.16.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3035"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="2685" name="self.model.layers.16.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="4222000912" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2686" name="Convert_1229872" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2687" name="self.model.layers.16.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4231438096" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2688" name="Convert_1229875" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2689" name="self.model.layers.16.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2690" name="self.model.layers.16.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4231441168" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2691" name="self.model.layers.16.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2692" name="__module.model.layers.16.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2693" name="__module.model.layers.16.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3037,3039,hidden_states.497"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2694" name="__module.model.layers.16/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3042,3044,3055,hidden_states.499,hidden_states.501"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2695" name="Constant_1176001" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="4231447312" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2696" name="Constant_1176000" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2697" name="Constant_1175998" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2698" name="__module.model.layers.16.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3045"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2699" name="Constant_1102475" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3046"> <dim>1</dim> </port> </output> </layer> <layer id="2700" name="__module.model.layers.16.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3047,variance.67"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2701" name="Constant_1175999" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2702" name="__module.model.layers.16.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3048"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2703" name="__module.model.layers.16.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2704" name="__module.model.layers.16.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3049"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2705" name="__module.model.layers.16.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3050,3051,hidden_states.503,hidden_states.505"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2706" name="__module.model.layers.16.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3052,3054"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2707" name="self.model.layers.16.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="4231459600" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2708" name="Convert_1228832" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2709" name="self.model.layers.16.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="4302238480" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2710" name="Convert_1228835" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2711" name="self.model.layers.16.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2712" name="self.model.layers.16.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="4302261520" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2713" name="self.model.layers.16.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2714" name="__module.model.layers.16.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2715" name="__module.model.layers.16.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3060,input.33"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2716" name="__module.model.layers.16.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="3061"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2717" name="self.model.layers.16.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="4302307600" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2718" name="Convert_1228822" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2719" name="self.model.layers.16.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="4373086480" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2720" name="Convert_1228825" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2721" name="self.model.layers.16.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2722" name="self.model.layers.16.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="4373109520" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2723" name="self.model.layers.16.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2724" name="__module.model.layers.16.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2725" name="__module.model.layers.16.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3063"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2726" name="__module.model.layers.16.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3064"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2727" name="self.model.layers.16.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="4373155600" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2728" name="Convert_1228842" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2729" name="self.model.layers.16.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4443934480" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2730" name="Convert_1228845" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2731" name="self.model.layers.16.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2732" name="self.model.layers.16.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4443937552" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2733" name="self.model.layers.16.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2734" name="__module.model.layers.16.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2735" name="__module.model.layers.16.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3066,hidden_states.507"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2736" name="__module.model.layers.16/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3067,3069,3077,3088,hidden_states.509,hidden_states.511"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2737" name="Constant_1176005" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="4443943696" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2738" name="Constant_1176004" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2739" name="Constant_1176002" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2740" name="__module.model.layers.17.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3078"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2741" name="Constant_1102549" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3079"> <dim>1</dim> </port> </output> </layer> <layer id="2742" name="__module.model.layers.17.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3080,variance.69"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2743" name="Constant_1176003" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2744" name="__module.model.layers.17.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3081"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2745" name="__module.model.layers.17.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2746" name="__module.model.layers.17.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3082"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2747" name="__module.model.layers.17.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3083,3084,hidden_states.513,hidden_states.515"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2748" name="__module.model.layers.17.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3085,3087,hidden_states.517"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2749" name="self.model.layers.17.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="4443955984" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2750" name="Convert_1229882" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2751" name="self.model.layers.17.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4453393168" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2752" name="Convert_1229885" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2753" name="self.model.layers.17.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2754" name="self.model.layers.17.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4453396240" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2755" name="self.model.layers.17.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2756" name="__module.model.layers.17.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2757" name="__module.model.layers.17.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3096,query_states.35"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2758" name="Constant_1187802" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2759" name="__module.model.layers.17.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3102"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2760" name="__module.model.layers.17.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2761" name="__module.model.layers.17.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3103,q.35"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2762" name="__module.model.layers.17.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3112"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2763" name="Constant_1102946" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2764" name="Constant_1102948" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2765" name="Constant_1102950" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2766" name="__module.model.layers.17.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3122,x2.69"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2767" name="Constant_1176006" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2768" name="__module.model.layers.17.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3123"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2769" name="Constant_1102843" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2770" name="Constant_1102887" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2771" name="Constant_1102889" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2772" name="__module.model.layers.17.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3117"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2773" name="__module.model.layers.17.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3125"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2774" name="__module.model.layers.17.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3126"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2775" name="__module.model.layers.17.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3127"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2776" name="ReadValue_1190096" type="ReadValue" version="opset6"> <data variable_id="past_key_values.17.keypresent.17.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.17.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2777" name="Constant_1189477" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2778" name="Gather_1189478" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2779" name="self.model.layers.17.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="4453402384" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2780" name="Convert_1230692" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2781" name="self.model.layers.17.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="4456548112" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2782" name="Convert_1230695" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2783" name="self.model.layers.17.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2784" name="self.model.layers.17.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="4456549136" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2785" name="self.model.layers.17.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2786" name="__module.model.layers.17.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2787" name="__module.model.layers.17.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3098,key_states.73"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2788" name="Constant_1187803" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2789" name="__module.model.layers.17.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3105"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2790" name="__module.model.layers.17.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2791" name="__module.model.layers.17.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3106,k.35"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2792" name="__module.model.layers.17.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3128"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2793" name="Constant_1103089" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2794" name="Constant_1103091" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2795" name="Constant_1103093" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2796" name="__module.model.layers.17.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3138,x2.71"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2797" name="Constant_1176007" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2798" name="__module.model.layers.17.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3139"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2799" name="Constant_1102986" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2800" name="Constant_1103030" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2801" name="Constant_1103032" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2802" name="__module.model.layers.17.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3133"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2803" name="__module.model.layers.17.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3141"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2804" name="__module.model.layers.17.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3142"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2805" name="__module.model.layers.17.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3143"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2806" name="__module.model.layers.17.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3153,3154,hidden_states.519,present.17.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2807" name="__module.model.layers.17.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3155,3156,3157"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2808" name="__module.model.layers.17.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3159,hidden_states.521"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2809" name="Constant_1187804" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2810" name="__module.model.layers.17.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3163,key_states.75"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2811" name="ReadValue_1190098" type="ReadValue" version="opset6"> <data variable_id="past_key_values.17.valuepresent.17.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.17.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2812" name="Constant_1189480" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2813" name="Gather_1189481" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2814" name="self.model.layers.17.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="4456551184" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2815" name="Convert_1230682" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2816" name="self.model.layers.17.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="4459696912" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2817" name="Convert_1230685" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2818" name="self.model.layers.17.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2819" name="self.model.layers.17.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="4459697936" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2820" name="self.model.layers.17.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2821" name="__module.model.layers.17.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2822" name="__module.model.layers.17.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3100,value_states.35"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2823" name="Constant_1187805" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2824" name="__module.model.layers.17.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3108"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2825" name="__module.model.layers.17.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2826" name="__module.model.layers.17.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3109"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2827" name="__module.model.layers.17.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3169,3170,hidden_states.523,present.17.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2828" name="__module.model.layers.17.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3171,3172,3173"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2829" name="__module.model.layers.17.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3175,hidden_states.525"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2830" name="Constant_1187806" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2831" name="__module.model.layers.17.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3179"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2832" name="__module.model.layers.17.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3185,attn_output.69"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2833" name="__module.model.layers.17.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2834" name="__module.model.layers.17.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3186"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2835" name="__module.model.layers.17.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3189"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="2836" name="self.model.layers.17.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="4459699984" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2837" name="Convert_1229892" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2838" name="self.model.layers.17.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4469137168" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2839" name="Convert_1229895" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2840" name="self.model.layers.17.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2841" name="self.model.layers.17.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4469140240" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2842" name="self.model.layers.17.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2843" name="__module.model.layers.17.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2844" name="__module.model.layers.17.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3191,3193,hidden_states.527"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2845" name="__module.model.layers.17/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3196,3198,3209,hidden_states.529,hidden_states.531"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2846" name="Constant_1176011" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="4469146384" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2847" name="Constant_1176010" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2848" name="Constant_1176008" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2849" name="__module.model.layers.17.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3199"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2850" name="Constant_1103692" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3200"> <dim>1</dim> </port> </output> </layer> <layer id="2851" name="__module.model.layers.17.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3201,variance.71"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2852" name="Constant_1176009" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2853" name="__module.model.layers.17.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3202"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2854" name="__module.model.layers.17.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2855" name="__module.model.layers.17.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3203"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2856" name="__module.model.layers.17.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3204,3205,hidden_states.533,hidden_states.535"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2857" name="__module.model.layers.17.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3206,3208"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2858" name="self.model.layers.17.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="4469158672" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2859" name="Convert_1228862" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2860" name="self.model.layers.17.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="4539937552" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2861" name="Convert_1228865" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2862" name="self.model.layers.17.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2863" name="self.model.layers.17.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="4539960592" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2864" name="self.model.layers.17.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2865" name="__module.model.layers.17.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2866" name="__module.model.layers.17.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3214,input.35"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2867" name="__module.model.layers.17.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="3215"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2868" name="self.model.layers.17.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="4540006672" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2869" name="Convert_1228852" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2870" name="self.model.layers.17.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="4610785552" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2871" name="Convert_1228855" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2872" name="self.model.layers.17.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2873" name="self.model.layers.17.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="4610808592" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="2874" name="self.model.layers.17.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2875" name="__module.model.layers.17.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2876" name="__module.model.layers.17.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3217"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2877" name="__module.model.layers.17.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3218"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2878" name="self.model.layers.17.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="4610854672" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2879" name="Convert_1228872" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2880" name="self.model.layers.17.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4681633552" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2881" name="Convert_1228875" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2882" name="self.model.layers.17.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2883" name="self.model.layers.17.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4681636624" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2884" name="self.model.layers.17.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2885" name="__module.model.layers.17.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="2886" name="__module.model.layers.17.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3220,hidden_states.537"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2887" name="__module.model.layers.17/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3221,3223,3231,3242,hidden_states.539,hidden_states.541"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2888" name="Constant_1176015" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="4681642768" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2889" name="Constant_1176014" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2890" name="Constant_1176012" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2891" name="__module.model.layers.18.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3232"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2892" name="Constant_1103766" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3233"> <dim>1</dim> </port> </output> </layer> <layer id="2893" name="__module.model.layers.18.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3234,variance.73"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2894" name="Constant_1176013" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2895" name="__module.model.layers.18.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3235"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2896" name="__module.model.layers.18.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2897" name="__module.model.layers.18.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3236"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2898" name="__module.model.layers.18.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3237,3238,hidden_states.543,hidden_states.545"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2899" name="__module.model.layers.18.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3239,3241,hidden_states.547"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2900" name="self.model.layers.18.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="4681655056" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2901" name="Convert_1229902" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2902" name="self.model.layers.18.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4691092240" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2903" name="Convert_1229905" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2904" name="self.model.layers.18.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2905" name="self.model.layers.18.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4691095312" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2906" name="self.model.layers.18.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2907" name="__module.model.layers.18.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2908" name="__module.model.layers.18.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3250,query_states.37"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2909" name="Constant_1187807" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2910" name="__module.model.layers.18.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3256"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2911" name="__module.model.layers.18.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2912" name="__module.model.layers.18.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3257,q.37"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2913" name="__module.model.layers.18.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3266"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2914" name="Constant_1104163" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2915" name="Constant_1104165" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2916" name="Constant_1104167" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2917" name="__module.model.layers.18.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3276,x2.73"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2918" name="Constant_1176016" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2919" name="__module.model.layers.18.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3277"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2920" name="Constant_1104060" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2921" name="Constant_1104104" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2922" name="Constant_1104106" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2923" name="__module.model.layers.18.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3271"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2924" name="__module.model.layers.18.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3279"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2925" name="__module.model.layers.18.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3280"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2926" name="__module.model.layers.18.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3281"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2927" name="ReadValue_1190100" type="ReadValue" version="opset6"> <data variable_id="past_key_values.18.keypresent.18.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.18.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2928" name="Constant_1189483" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2929" name="Gather_1189484" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2930" name="self.model.layers.18.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="4691101456" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2931" name="Convert_1230712" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2932" name="self.model.layers.18.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="4694247184" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2933" name="Convert_1230715" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2934" name="self.model.layers.18.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2935" name="self.model.layers.18.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="4694248208" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2936" name="self.model.layers.18.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2937" name="__module.model.layers.18.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2938" name="__module.model.layers.18.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3252,key_states.77"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2939" name="Constant_1187808" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2940" name="__module.model.layers.18.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3259"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2941" name="__module.model.layers.18.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2942" name="__module.model.layers.18.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3260,k.37"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2943" name="__module.model.layers.18.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3282"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2944" name="Constant_1104306" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2945" name="Constant_1104308" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2946" name="Constant_1104310" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2947" name="__module.model.layers.18.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3292,x2.75"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2948" name="Constant_1176017" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2949" name="__module.model.layers.18.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3293"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2950" name="Constant_1104203" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2951" name="Constant_1104247" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2952" name="Constant_1104249" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2953" name="__module.model.layers.18.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3287"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="2954" name="__module.model.layers.18.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3295"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2955" name="__module.model.layers.18.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3296"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2956" name="__module.model.layers.18.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3297"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2957" name="__module.model.layers.18.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3307,3308,hidden_states.549,present.18.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2958" name="__module.model.layers.18.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3309,3310,3311"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2959" name="__module.model.layers.18.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3313,hidden_states.551"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2960" name="Constant_1187809" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2961" name="__module.model.layers.18.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3317,key_states.79"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2962" name="ReadValue_1190102" type="ReadValue" version="opset6"> <data variable_id="past_key_values.18.valuepresent.18.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.18.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2963" name="Constant_1189486" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2964" name="Gather_1189487" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2965" name="self.model.layers.18.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="4694250256" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2966" name="Convert_1230702" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2967" name="self.model.layers.18.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="4697395984" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2968" name="Convert_1230705" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2969" name="self.model.layers.18.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2970" name="self.model.layers.18.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="4697397008" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="2971" name="self.model.layers.18.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2972" name="__module.model.layers.18.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2973" name="__module.model.layers.18.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3254,value_states.37"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2974" name="Constant_1187810" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2975" name="__module.model.layers.18.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3262"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="2976" name="__module.model.layers.18.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2977" name="__module.model.layers.18.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3263"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2978" name="__module.model.layers.18.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3323,3324,hidden_states.553,present.18.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2979" name="__module.model.layers.18.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3325,3326,3327"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2980" name="__module.model.layers.18.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3329,hidden_states.555"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2981" name="Constant_1187811" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2982" name="__module.model.layers.18.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3333"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2983" name="__module.model.layers.18.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3339,attn_output.73"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="2984" name="__module.model.layers.18.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2985" name="__module.model.layers.18.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3340"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="2986" name="__module.model.layers.18.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3343"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="2987" name="self.model.layers.18.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="4697399056" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2988" name="Convert_1229912" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2989" name="self.model.layers.18.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4706836240" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2990" name="Convert_1229915" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2991" name="self.model.layers.18.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2992" name="self.model.layers.18.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4706839312" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="2993" name="self.model.layers.18.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2994" name="__module.model.layers.18.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2995" name="__module.model.layers.18.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3345,3347,hidden_states.557"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2996" name="__module.model.layers.18/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3350,3352,3363,hidden_states.559,hidden_states.561"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2997" name="Constant_1176021" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="4706845456" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2998" name="Constant_1176020" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2999" name="Constant_1176018" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3000" name="__module.model.layers.18.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3353"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3001" name="Constant_1104909" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3354"> <dim>1</dim> </port> </output> </layer> <layer id="3002" name="__module.model.layers.18.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3355,variance.75"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3003" name="Constant_1176019" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3004" name="__module.model.layers.18.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3356"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3005" name="__module.model.layers.18.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3006" name="__module.model.layers.18.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3357"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3007" name="__module.model.layers.18.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3358,3359,hidden_states.563,hidden_states.565"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3008" name="__module.model.layers.18.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3360,3362"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3009" name="self.model.layers.18.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="4706857744" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3010" name="Convert_1228892" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3011" name="self.model.layers.18.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="4777636624" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3012" name="Convert_1228895" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3013" name="self.model.layers.18.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3014" name="self.model.layers.18.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="4777659664" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3015" name="self.model.layers.18.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3016" name="__module.model.layers.18.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3017" name="__module.model.layers.18.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3368,input.37"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3018" name="__module.model.layers.18.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="3369"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3019" name="self.model.layers.18.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="4777705744" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3020" name="Convert_1228882" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3021" name="self.model.layers.18.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="4848484624" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3022" name="Convert_1228885" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3023" name="self.model.layers.18.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3024" name="self.model.layers.18.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="4848507664" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3025" name="self.model.layers.18.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3026" name="__module.model.layers.18.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3027" name="__module.model.layers.18.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3371"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3028" name="__module.model.layers.18.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3372"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3029" name="self.model.layers.18.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="4848553744" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3030" name="Convert_1228902" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3031" name="self.model.layers.18.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4919332624" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3032" name="Convert_1228905" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3033" name="self.model.layers.18.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3034" name="self.model.layers.18.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4919335696" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3035" name="self.model.layers.18.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3036" name="__module.model.layers.18.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3037" name="__module.model.layers.18.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3374,hidden_states.567"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3038" name="__module.model.layers.18/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3375,3377,3385,3396,hidden_states.569,hidden_states.571"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3039" name="Constant_1176025" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="4919341840" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3040" name="Constant_1176024" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3041" name="Constant_1176022" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3042" name="__module.model.layers.19.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3386"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3043" name="Constant_1104983" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3387"> <dim>1</dim> </port> </output> </layer> <layer id="3044" name="__module.model.layers.19.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3388,variance.77"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3045" name="Constant_1176023" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3046" name="__module.model.layers.19.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3389"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3047" name="__module.model.layers.19.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3048" name="__module.model.layers.19.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3390"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3049" name="__module.model.layers.19.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3391,3392,hidden_states.573,hidden_states.575"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3050" name="__module.model.layers.19.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3393,3395,hidden_states.577"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3051" name="self.model.layers.19.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="4919354128" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3052" name="Convert_1229922" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3053" name="self.model.layers.19.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4928791312" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3054" name="Convert_1229925" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3055" name="self.model.layers.19.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3056" name="self.model.layers.19.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4928794384" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3057" name="self.model.layers.19.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3058" name="__module.model.layers.19.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3059" name="__module.model.layers.19.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3404,query_states.39"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3060" name="Constant_1187812" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3061" name="__module.model.layers.19.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3410"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3062" name="__module.model.layers.19.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3063" name="__module.model.layers.19.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3411,q.39"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3064" name="__module.model.layers.19.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3420"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3065" name="Constant_1105380" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3066" name="Constant_1105382" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3067" name="Constant_1105384" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3068" name="__module.model.layers.19.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3430,x2.77"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3069" name="Constant_1176026" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3070" name="__module.model.layers.19.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3431"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3071" name="Constant_1105277" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3072" name="Constant_1105321" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3073" name="Constant_1105323" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3074" name="__module.model.layers.19.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3425"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3075" name="__module.model.layers.19.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3433"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3076" name="__module.model.layers.19.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3434"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3077" name="__module.model.layers.19.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3435"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3078" name="ReadValue_1190104" type="ReadValue" version="opset6"> <data variable_id="past_key_values.19.keypresent.19.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.19.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3079" name="Constant_1189489" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3080" name="Gather_1189490" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3081" name="self.model.layers.19.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="4928800528" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3082" name="Convert_1230732" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3083" name="self.model.layers.19.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="4931946256" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3084" name="Convert_1230735" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3085" name="self.model.layers.19.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3086" name="self.model.layers.19.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="4931947280" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3087" name="self.model.layers.19.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3088" name="__module.model.layers.19.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3089" name="__module.model.layers.19.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3406,key_states.81"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3090" name="Constant_1187813" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3091" name="__module.model.layers.19.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3413"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3092" name="__module.model.layers.19.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3093" name="__module.model.layers.19.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3414,k.39"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3094" name="__module.model.layers.19.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3436"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3095" name="Constant_1105523" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3096" name="Constant_1105525" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3097" name="Constant_1105527" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3098" name="__module.model.layers.19.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3446,x2.79"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3099" name="Constant_1176027" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3100" name="__module.model.layers.19.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3447"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3101" name="Constant_1105420" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3102" name="Constant_1105464" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3103" name="Constant_1105466" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3104" name="__module.model.layers.19.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3441"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3105" name="__module.model.layers.19.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3449"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3106" name="__module.model.layers.19.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3450"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3107" name="__module.model.layers.19.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3451"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3108" name="__module.model.layers.19.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3461,3462,hidden_states.579,present.19.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3109" name="__module.model.layers.19.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3463,3464,3465"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3110" name="__module.model.layers.19.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3467,hidden_states.581"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3111" name="Constant_1187814" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3112" name="__module.model.layers.19.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3471,key_states.83"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3113" name="ReadValue_1190106" type="ReadValue" version="opset6"> <data variable_id="past_key_values.19.valuepresent.19.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.19.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3114" name="Constant_1189492" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3115" name="Gather_1189493" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3116" name="self.model.layers.19.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="4931949328" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3117" name="Convert_1230722" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3118" name="self.model.layers.19.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="4935095056" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3119" name="Convert_1230725" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3120" name="self.model.layers.19.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3121" name="self.model.layers.19.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="4935096080" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3122" name="self.model.layers.19.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3123" name="__module.model.layers.19.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3124" name="__module.model.layers.19.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3408,value_states.39"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3125" name="Constant_1187815" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3126" name="__module.model.layers.19.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3416"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3127" name="__module.model.layers.19.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3128" name="__module.model.layers.19.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3417"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3129" name="__module.model.layers.19.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3477,3478,hidden_states.583,present.19.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3130" name="__module.model.layers.19.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3479,3480,3481"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3131" name="__module.model.layers.19.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3483,hidden_states.585"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3132" name="Constant_1187816" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3133" name="__module.model.layers.19.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3487"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3134" name="__module.model.layers.19.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3493,attn_output.77"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3135" name="__module.model.layers.19.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3136" name="__module.model.layers.19.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3494"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3137" name="__module.model.layers.19.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3497"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="3138" name="self.model.layers.19.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="4935098128" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3139" name="Convert_1229932" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3140" name="self.model.layers.19.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="4944535312" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3141" name="Convert_1229935" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3142" name="self.model.layers.19.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3143" name="self.model.layers.19.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="4944538384" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3144" name="self.model.layers.19.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3145" name="__module.model.layers.19.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3146" name="__module.model.layers.19.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3499,3501,hidden_states.587"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3147" name="__module.model.layers.19/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3504,3506,3517,hidden_states.589,hidden_states.591"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3148" name="Constant_1176031" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="4944544528" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3149" name="Constant_1176030" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3150" name="Constant_1176028" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3151" name="__module.model.layers.19.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3507"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3152" name="Constant_1106126" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3508"> <dim>1</dim> </port> </output> </layer> <layer id="3153" name="__module.model.layers.19.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3509,variance.79"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3154" name="Constant_1176029" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3155" name="__module.model.layers.19.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3510"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3156" name="__module.model.layers.19.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3157" name="__module.model.layers.19.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3511"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3158" name="__module.model.layers.19.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3512,3513,hidden_states.593,hidden_states.595"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3159" name="__module.model.layers.19.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3514,3516"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3160" name="self.model.layers.19.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="4944556816" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3161" name="Convert_1228922" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3162" name="self.model.layers.19.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="5015335696" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3163" name="Convert_1228925" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3164" name="self.model.layers.19.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3165" name="self.model.layers.19.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="5015358736" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3166" name="self.model.layers.19.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3167" name="__module.model.layers.19.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3168" name="__module.model.layers.19.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3522,input.39"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3169" name="__module.model.layers.19.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="3523"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3170" name="self.model.layers.19.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="5015404816" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3171" name="Convert_1228912" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3172" name="self.model.layers.19.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="5086183696" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3173" name="Convert_1228915" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3174" name="self.model.layers.19.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3175" name="self.model.layers.19.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="5086206736" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3176" name="self.model.layers.19.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3177" name="__module.model.layers.19.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3178" name="__module.model.layers.19.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3525"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3179" name="__module.model.layers.19.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3526"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3180" name="self.model.layers.19.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="5086252816" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3181" name="Convert_1228932" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3182" name="self.model.layers.19.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5157031696" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3183" name="Convert_1228935" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3184" name="self.model.layers.19.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3185" name="self.model.layers.19.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5157034768" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3186" name="self.model.layers.19.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3187" name="__module.model.layers.19.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3188" name="__module.model.layers.19.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3528,hidden_states.597"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3189" name="__module.model.layers.19/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3529,3531,3539,3550,hidden_states.599,hidden_states.601"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3190" name="Constant_1176035" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="5157040912" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3191" name="Constant_1176034" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3192" name="Constant_1176032" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3193" name="__module.model.layers.20.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3540"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3194" name="Constant_1106200" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3541"> <dim>1</dim> </port> </output> </layer> <layer id="3195" name="__module.model.layers.20.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3542,variance.81"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3196" name="Constant_1176033" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3197" name="__module.model.layers.20.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3543"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3198" name="__module.model.layers.20.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3199" name="__module.model.layers.20.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3544"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3200" name="__module.model.layers.20.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3545,3546,hidden_states.603,hidden_states.605"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3201" name="__module.model.layers.20.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3547,3549,hidden_states.607"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3202" name="self.model.layers.20.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="5157053200" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3203" name="Convert_1229942" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3204" name="self.model.layers.20.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5166490384" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3205" name="Convert_1229945" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3206" name="self.model.layers.20.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3207" name="self.model.layers.20.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5166493456" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3208" name="self.model.layers.20.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3209" name="__module.model.layers.20.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3210" name="__module.model.layers.20.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3558,query_states.41"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3211" name="Constant_1187817" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3212" name="__module.model.layers.20.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3564"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3213" name="__module.model.layers.20.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3214" name="__module.model.layers.20.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3565,q.41"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3215" name="__module.model.layers.20.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3574"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3216" name="Constant_1106597" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3217" name="Constant_1106599" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3218" name="Constant_1106601" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3219" name="__module.model.layers.20.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3584,x2.81"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3220" name="Constant_1176036" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3221" name="__module.model.layers.20.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3585"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3222" name="Constant_1106494" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3223" name="Constant_1106538" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3224" name="Constant_1106540" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3225" name="__module.model.layers.20.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3579"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3226" name="__module.model.layers.20.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3587"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3227" name="__module.model.layers.20.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3588"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3228" name="__module.model.layers.20.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3589"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3229" name="ReadValue_1190112" type="ReadValue" version="opset6"> <data variable_id="past_key_values.20.keypresent.20.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.20.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3230" name="Constant_1189495" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3231" name="Gather_1189496" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3232" name="self.model.layers.20.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="5166499600" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3233" name="Convert_1230752" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3234" name="self.model.layers.20.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="5169645328" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3235" name="Convert_1230755" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3236" name="self.model.layers.20.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3237" name="self.model.layers.20.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="5169646352" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3238" name="self.model.layers.20.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3239" name="__module.model.layers.20.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3240" name="__module.model.layers.20.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3560,key_states.85"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3241" name="Constant_1187818" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3242" name="__module.model.layers.20.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3567"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3243" name="__module.model.layers.20.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3244" name="__module.model.layers.20.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3568,k.41"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3245" name="__module.model.layers.20.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3590"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3246" name="Constant_1106740" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3247" name="Constant_1106742" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3248" name="Constant_1106744" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3249" name="__module.model.layers.20.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3600,x2.83"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3250" name="Constant_1176037" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3251" name="__module.model.layers.20.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3601"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3252" name="Constant_1106637" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3253" name="Constant_1106681" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3254" name="Constant_1106683" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3255" name="__module.model.layers.20.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3595"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3256" name="__module.model.layers.20.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3603"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3257" name="__module.model.layers.20.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3604"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3258" name="__module.model.layers.20.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3605"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3259" name="__module.model.layers.20.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3615,3616,hidden_states.609,present.20.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3260" name="__module.model.layers.20.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3617,3618,3619"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3261" name="__module.model.layers.20.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3621,hidden_states.611"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3262" name="Constant_1187819" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3263" name="__module.model.layers.20.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3625,key_states.87"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3264" name="ReadValue_1190114" type="ReadValue" version="opset6"> <data variable_id="past_key_values.20.valuepresent.20.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.20.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3265" name="Constant_1189498" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3266" name="Gather_1189499" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3267" name="self.model.layers.20.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="5169648400" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3268" name="Convert_1230742" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3269" name="self.model.layers.20.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="5172794128" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3270" name="Convert_1230745" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3271" name="self.model.layers.20.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3272" name="self.model.layers.20.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="5172795152" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3273" name="self.model.layers.20.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3274" name="__module.model.layers.20.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3275" name="__module.model.layers.20.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3562,value_states.41"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3276" name="Constant_1187820" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3277" name="__module.model.layers.20.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3570"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3278" name="__module.model.layers.20.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3279" name="__module.model.layers.20.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3571"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3280" name="__module.model.layers.20.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3631,3632,hidden_states.613,present.20.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3281" name="__module.model.layers.20.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3633,3634,3635"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3282" name="__module.model.layers.20.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3637,hidden_states.615"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3283" name="Constant_1187821" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3284" name="__module.model.layers.20.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3641"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3285" name="__module.model.layers.20.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3647,attn_output.81"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3286" name="__module.model.layers.20.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3287" name="__module.model.layers.20.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3648"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3288" name="__module.model.layers.20.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3651"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="3289" name="self.model.layers.20.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="5172797200" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3290" name="Convert_1229952" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3291" name="self.model.layers.20.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5182234384" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3292" name="Convert_1229955" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3293" name="self.model.layers.20.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3294" name="self.model.layers.20.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5182237456" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3295" name="self.model.layers.20.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3296" name="__module.model.layers.20.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3297" name="__module.model.layers.20.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3653,3655,hidden_states.617"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3298" name="__module.model.layers.20/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3658,3660,3671,hidden_states.619,hidden_states.621"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3299" name="Constant_1176041" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="5182243600" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3300" name="Constant_1176040" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3301" name="Constant_1176038" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3302" name="__module.model.layers.20.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3661"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3303" name="Constant_1107343" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3662"> <dim>1</dim> </port> </output> </layer> <layer id="3304" name="__module.model.layers.20.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3663,variance.83"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3305" name="Constant_1176039" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3306" name="__module.model.layers.20.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3664"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3307" name="__module.model.layers.20.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3308" name="__module.model.layers.20.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3665"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3309" name="__module.model.layers.20.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3666,3667,hidden_states.623,hidden_states.625"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3310" name="__module.model.layers.20.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3668,3670"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3311" name="self.model.layers.20.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="5182255888" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3312" name="Convert_1228952" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3313" name="self.model.layers.20.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="5253034768" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3314" name="Convert_1228955" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3315" name="self.model.layers.20.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3316" name="self.model.layers.20.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="5253057808" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3317" name="self.model.layers.20.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3318" name="__module.model.layers.20.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3319" name="__module.model.layers.20.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3676,input.41"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3320" name="__module.model.layers.20.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="3677"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3321" name="self.model.layers.20.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="5253103888" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3322" name="Convert_1228942" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3323" name="self.model.layers.20.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="5323882768" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3324" name="Convert_1228945" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3325" name="self.model.layers.20.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3326" name="self.model.layers.20.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="5323905808" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3327" name="self.model.layers.20.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3328" name="__module.model.layers.20.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3329" name="__module.model.layers.20.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3679"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3330" name="__module.model.layers.20.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3680"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3331" name="self.model.layers.20.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="5323951888" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3332" name="Convert_1228962" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3333" name="self.model.layers.20.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5394730768" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3334" name="Convert_1228965" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3335" name="self.model.layers.20.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3336" name="self.model.layers.20.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5394733840" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3337" name="self.model.layers.20.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3338" name="__module.model.layers.20.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3339" name="__module.model.layers.20.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3682,hidden_states.627"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3340" name="__module.model.layers.20/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3683,3685,3693,3704,hidden_states.629,hidden_states.631"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3341" name="Constant_1176045" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="5394739984" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3342" name="Constant_1176044" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3343" name="Constant_1176042" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3344" name="__module.model.layers.21.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3694"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3345" name="Constant_1107417" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3695"> <dim>1</dim> </port> </output> </layer> <layer id="3346" name="__module.model.layers.21.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3696,variance.85"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3347" name="Constant_1176043" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3348" name="__module.model.layers.21.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3697"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3349" name="__module.model.layers.21.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3350" name="__module.model.layers.21.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3698"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3351" name="__module.model.layers.21.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3699,3700,hidden_states.633,hidden_states.635"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3352" name="__module.model.layers.21.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3701,3703,hidden_states.637"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3353" name="self.model.layers.21.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="5394752272" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3354" name="Convert_1229962" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3355" name="self.model.layers.21.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5404189456" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3356" name="Convert_1229965" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3357" name="self.model.layers.21.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3358" name="self.model.layers.21.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5404192528" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3359" name="self.model.layers.21.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3360" name="__module.model.layers.21.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3361" name="__module.model.layers.21.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3712,query_states.43"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3362" name="Constant_1187822" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3363" name="__module.model.layers.21.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3718"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3364" name="__module.model.layers.21.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3365" name="__module.model.layers.21.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3719,q.43"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3366" name="__module.model.layers.21.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3728"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3367" name="Constant_1107814" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3368" name="Constant_1107816" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3369" name="Constant_1107818" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3370" name="__module.model.layers.21.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3738,x2.85"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3371" name="Constant_1176046" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3372" name="__module.model.layers.21.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3739"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3373" name="Constant_1107711" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3374" name="Constant_1107755" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3375" name="Constant_1107757" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3376" name="__module.model.layers.21.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3733"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3377" name="__module.model.layers.21.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3741"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3378" name="__module.model.layers.21.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3742"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3379" name="__module.model.layers.21.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3743"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3380" name="ReadValue_1190116" type="ReadValue" version="opset6"> <data variable_id="past_key_values.21.keypresent.21.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.21.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3381" name="Constant_1189501" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3382" name="Gather_1189502" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3383" name="self.model.layers.21.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="5404198672" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3384" name="Convert_1230772" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3385" name="self.model.layers.21.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="5407344400" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3386" name="Convert_1230775" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3387" name="self.model.layers.21.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3388" name="self.model.layers.21.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="5407345424" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3389" name="self.model.layers.21.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3390" name="__module.model.layers.21.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3391" name="__module.model.layers.21.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3714,key_states.89"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3392" name="Constant_1187823" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3393" name="__module.model.layers.21.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3721"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3394" name="__module.model.layers.21.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3395" name="__module.model.layers.21.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3722,k.43"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3396" name="__module.model.layers.21.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3744"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3397" name="Constant_1107957" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3398" name="Constant_1107959" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3399" name="Constant_1107961" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3400" name="__module.model.layers.21.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3754,x2.87"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3401" name="Constant_1176047" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3402" name="__module.model.layers.21.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3755"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3403" name="Constant_1107854" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3404" name="Constant_1107898" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3405" name="Constant_1107900" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3406" name="__module.model.layers.21.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3749"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3407" name="__module.model.layers.21.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3757"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3408" name="__module.model.layers.21.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3758"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3409" name="__module.model.layers.21.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3759"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3410" name="__module.model.layers.21.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3769,3770,hidden_states.639,present.21.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3411" name="__module.model.layers.21.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3771,3772,3773"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3412" name="__module.model.layers.21.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3775,hidden_states.641"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3413" name="Constant_1187824" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3414" name="__module.model.layers.21.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3779,key_states.91"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3415" name="ReadValue_1190118" type="ReadValue" version="opset6"> <data variable_id="past_key_values.21.valuepresent.21.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.21.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3416" name="Constant_1189504" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3417" name="Gather_1189505" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3418" name="self.model.layers.21.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="5407347472" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3419" name="Convert_1230762" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3420" name="self.model.layers.21.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="5410493200" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3421" name="Convert_1230765" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3422" name="self.model.layers.21.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3423" name="self.model.layers.21.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="5410494224" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3424" name="self.model.layers.21.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3425" name="__module.model.layers.21.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3426" name="__module.model.layers.21.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3716,value_states.43"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3427" name="Constant_1187825" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3428" name="__module.model.layers.21.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3724"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3429" name="__module.model.layers.21.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3430" name="__module.model.layers.21.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3725"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3431" name="__module.model.layers.21.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3785,3786,hidden_states.643,present.21.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3432" name="__module.model.layers.21.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3787,3788,3789"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3433" name="__module.model.layers.21.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3791,hidden_states.645"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3434" name="Constant_1187826" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3435" name="__module.model.layers.21.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3795"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3436" name="__module.model.layers.21.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3801,attn_output.85"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3437" name="__module.model.layers.21.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3438" name="__module.model.layers.21.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3802"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3439" name="__module.model.layers.21.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3805"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="3440" name="self.model.layers.21.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="5410496272" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3441" name="Convert_1229972" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3442" name="self.model.layers.21.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5419933456" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3443" name="Convert_1229975" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3444" name="self.model.layers.21.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3445" name="self.model.layers.21.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5419936528" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3446" name="self.model.layers.21.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3447" name="__module.model.layers.21.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3448" name="__module.model.layers.21.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3807,3809,hidden_states.647"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3449" name="__module.model.layers.21/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3812,3814,3825,hidden_states.649,hidden_states.651"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3450" name="Constant_1176051" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="5419942672" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3451" name="Constant_1176050" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3452" name="Constant_1176048" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3453" name="__module.model.layers.21.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3815"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3454" name="Constant_1108560" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3816"> <dim>1</dim> </port> </output> </layer> <layer id="3455" name="__module.model.layers.21.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3817,variance.87"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3456" name="Constant_1176049" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3457" name="__module.model.layers.21.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3818"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3458" name="__module.model.layers.21.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3459" name="__module.model.layers.21.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3819"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3460" name="__module.model.layers.21.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3820,3821,hidden_states.653,hidden_states.655"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3461" name="__module.model.layers.21.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3822,3824"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3462" name="self.model.layers.21.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="5419954960" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3463" name="Convert_1228982" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3464" name="self.model.layers.21.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="5490733840" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3465" name="Convert_1228985" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3466" name="self.model.layers.21.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3467" name="self.model.layers.21.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="5490756880" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3468" name="self.model.layers.21.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3469" name="__module.model.layers.21.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3470" name="__module.model.layers.21.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3830,input.43"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3471" name="__module.model.layers.21.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="3831"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3472" name="self.model.layers.21.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="5490802960" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3473" name="Convert_1228972" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3474" name="self.model.layers.21.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="5561581840" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3475" name="Convert_1228975" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3476" name="self.model.layers.21.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3477" name="self.model.layers.21.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="5561604880" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3478" name="self.model.layers.21.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3479" name="__module.model.layers.21.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3480" name="__module.model.layers.21.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3833"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3481" name="__module.model.layers.21.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3834"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3482" name="self.model.layers.21.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="5561650960" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3483" name="Convert_1228992" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3484" name="self.model.layers.21.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5632429840" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3485" name="Convert_1228995" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3486" name="self.model.layers.21.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3487" name="self.model.layers.21.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5632432912" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3488" name="self.model.layers.21.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3489" name="__module.model.layers.21.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3490" name="__module.model.layers.21.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3836,hidden_states.657"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3491" name="__module.model.layers.21/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3837,3839,3847,3858,hidden_states.659,hidden_states.661"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3492" name="Constant_1176055" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="5632439056" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3493" name="Constant_1176054" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3494" name="Constant_1176052" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3495" name="__module.model.layers.22.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3848"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3496" name="Constant_1108634" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3849"> <dim>1</dim> </port> </output> </layer> <layer id="3497" name="__module.model.layers.22.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3850,variance.89"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3498" name="Constant_1176053" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3499" name="__module.model.layers.22.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3851"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3500" name="__module.model.layers.22.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3501" name="__module.model.layers.22.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3852"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3502" name="__module.model.layers.22.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3853,3854,hidden_states.663,hidden_states.665"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3503" name="__module.model.layers.22.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3855,3857,hidden_states.667"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3504" name="self.model.layers.22.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="5632451344" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3505" name="Convert_1229982" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3506" name="self.model.layers.22.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5641888528" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3507" name="Convert_1229985" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3508" name="self.model.layers.22.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3509" name="self.model.layers.22.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5641891600" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3510" name="self.model.layers.22.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3511" name="__module.model.layers.22.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3512" name="__module.model.layers.22.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3866,query_states.45"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3513" name="Constant_1187827" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3514" name="__module.model.layers.22.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3872"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3515" name="__module.model.layers.22.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3516" name="__module.model.layers.22.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3873,q.45"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3517" name="__module.model.layers.22.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3882"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3518" name="Constant_1109031" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3519" name="Constant_1109033" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3520" name="Constant_1109035" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3521" name="__module.model.layers.22.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3892,x2.89"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3522" name="Constant_1176056" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3523" name="__module.model.layers.22.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3893"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3524" name="Constant_1108928" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3525" name="Constant_1108972" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3526" name="Constant_1108974" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3527" name="__module.model.layers.22.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3887"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3528" name="__module.model.layers.22.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3895"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3529" name="__module.model.layers.22.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3896"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3530" name="__module.model.layers.22.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3897"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3531" name="ReadValue_1190120" type="ReadValue" version="opset6"> <data variable_id="past_key_values.22.keypresent.22.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.22.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3532" name="Constant_1189507" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3533" name="Gather_1189508" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3534" name="self.model.layers.22.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="5641897744" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3535" name="Convert_1230792" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3536" name="self.model.layers.22.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="5645043472" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3537" name="Convert_1230795" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3538" name="self.model.layers.22.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3539" name="self.model.layers.22.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="5645044496" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3540" name="self.model.layers.22.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3541" name="__module.model.layers.22.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3542" name="__module.model.layers.22.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3868,key_states.93"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3543" name="Constant_1187828" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3544" name="__module.model.layers.22.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3875"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3545" name="__module.model.layers.22.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3546" name="__module.model.layers.22.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3876,k.45"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3547" name="__module.model.layers.22.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3898"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3548" name="Constant_1109174" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3549" name="Constant_1109176" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3550" name="Constant_1109178" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3551" name="__module.model.layers.22.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3908,x2.91"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3552" name="Constant_1176057" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3553" name="__module.model.layers.22.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3909"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3554" name="Constant_1109071" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3555" name="Constant_1109115" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3556" name="Constant_1109117" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3557" name="__module.model.layers.22.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3903"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3558" name="__module.model.layers.22.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="3911"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3559" name="__module.model.layers.22.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3912"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3560" name="__module.model.layers.22.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3913"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3561" name="__module.model.layers.22.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3923,3924,hidden_states.669,present.22.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3562" name="__module.model.layers.22.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3925,3926,3927"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3563" name="__module.model.layers.22.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3929,hidden_states.671"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3564" name="Constant_1187829" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3565" name="__module.model.layers.22.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3933,key_states.95"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3566" name="ReadValue_1190122" type="ReadValue" version="opset6"> <data variable_id="past_key_values.22.valuepresent.22.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.22.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3567" name="Constant_1189510" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3568" name="Gather_1189511" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3569" name="self.model.layers.22.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="5645046544" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3570" name="Convert_1230782" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3571" name="self.model.layers.22.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="5648192272" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3572" name="Convert_1230785" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3573" name="self.model.layers.22.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3574" name="self.model.layers.22.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="5648193296" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3575" name="self.model.layers.22.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3576" name="__module.model.layers.22.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3577" name="__module.model.layers.22.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3870,value_states.45"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3578" name="Constant_1187830" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3579" name="__module.model.layers.22.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3878"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3580" name="__module.model.layers.22.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3581" name="__module.model.layers.22.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3879"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3582" name="__module.model.layers.22.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="3939,3940,hidden_states.673,present.22.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3583" name="__module.model.layers.22.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="3941,3942,3943"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3584" name="__module.model.layers.22.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="3945,hidden_states.675"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3585" name="Constant_1187831" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3586" name="__module.model.layers.22.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3949"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3587" name="__module.model.layers.22.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3955,attn_output.89"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3588" name="__module.model.layers.22.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3589" name="__module.model.layers.22.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3956"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3590" name="__module.model.layers.22.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3959"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="3591" name="self.model.layers.22.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="5648195344" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3592" name="Convert_1229992" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3593" name="self.model.layers.22.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5657632528" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3594" name="Convert_1229995" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3595" name="self.model.layers.22.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3596" name="self.model.layers.22.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5657635600" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3597" name="self.model.layers.22.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3598" name="__module.model.layers.22.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3599" name="__module.model.layers.22.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3961,3963,hidden_states.677"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3600" name="__module.model.layers.22/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3966,3968,3979,hidden_states.679,hidden_states.681"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3601" name="Constant_1176061" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="5657641744" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3602" name="Constant_1176060" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3603" name="Constant_1176058" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3604" name="__module.model.layers.22.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3969"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3605" name="Constant_1109777" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="3970"> <dim>1</dim> </port> </output> </layer> <layer id="3606" name="__module.model.layers.22.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3971,variance.91"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3607" name="Constant_1176059" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3608" name="__module.model.layers.22.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3972"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3609" name="__module.model.layers.22.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3610" name="__module.model.layers.22.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3973"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3611" name="__module.model.layers.22.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3974,3975,hidden_states.683,hidden_states.685"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3612" name="__module.model.layers.22.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3976,3978"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3613" name="self.model.layers.22.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="5657654032" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3614" name="Convert_1229012" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3615" name="self.model.layers.22.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="5728432912" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3616" name="Convert_1229015" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3617" name="self.model.layers.22.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3618" name="self.model.layers.22.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="5728455952" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3619" name="self.model.layers.22.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3620" name="__module.model.layers.22.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3621" name="__module.model.layers.22.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3984,input.45"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3622" name="__module.model.layers.22.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="3985"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3623" name="self.model.layers.22.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="5728502032" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3624" name="Convert_1229002" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3625" name="self.model.layers.22.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="5799280912" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3626" name="Convert_1229005" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3627" name="self.model.layers.22.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3628" name="self.model.layers.22.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="5799303952" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3629" name="self.model.layers.22.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3630" name="__module.model.layers.22.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3631" name="__module.model.layers.22.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3987"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3632" name="__module.model.layers.22.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3988"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3633" name="self.model.layers.22.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="5799350032" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3634" name="Convert_1229022" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3635" name="self.model.layers.22.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5870128912" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3636" name="Convert_1229025" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3637" name="self.model.layers.22.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3638" name="self.model.layers.22.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5870131984" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3639" name="self.model.layers.22.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3640" name="__module.model.layers.22.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3641" name="__module.model.layers.22.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="3990,hidden_states.687"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3642" name="__module.model.layers.22/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3991,3993,4001,4012,hidden_states.689,hidden_states.691"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3643" name="Constant_1176065" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="5870138128" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3644" name="Constant_1176064" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3645" name="Constant_1176062" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3646" name="__module.model.layers.23.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4002"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3647" name="Constant_1109851" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4003"> <dim>1</dim> </port> </output> </layer> <layer id="3648" name="__module.model.layers.23.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4004,variance.93"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3649" name="Constant_1176063" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3650" name="__module.model.layers.23.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4005"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3651" name="__module.model.layers.23.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3652" name="__module.model.layers.23.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4006"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3653" name="__module.model.layers.23.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4007,4008,hidden_states.693,hidden_states.695"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3654" name="__module.model.layers.23.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4009,4011,hidden_states.697"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3655" name="self.model.layers.23.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="5870150416" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3656" name="Convert_1230002" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3657" name="self.model.layers.23.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5879587600" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3658" name="Convert_1230005" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3659" name="self.model.layers.23.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3660" name="self.model.layers.23.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5879590672" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3661" name="self.model.layers.23.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3662" name="__module.model.layers.23.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3663" name="__module.model.layers.23.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4020,query_states.47"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3664" name="Constant_1187832" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3665" name="__module.model.layers.23.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4026"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3666" name="__module.model.layers.23.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3667" name="__module.model.layers.23.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4027,q.47"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3668" name="__module.model.layers.23.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4036"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3669" name="Constant_1110248" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3670" name="Constant_1110250" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3671" name="Constant_1110252" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3672" name="__module.model.layers.23.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4046,x2.93"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3673" name="Constant_1176066" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3674" name="__module.model.layers.23.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4047"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3675" name="Constant_1110145" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3676" name="Constant_1110189" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3677" name="Constant_1110191" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3678" name="__module.model.layers.23.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4041"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3679" name="__module.model.layers.23.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4049"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3680" name="__module.model.layers.23.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4050"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3681" name="__module.model.layers.23.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4051"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3682" name="ReadValue_1190124" type="ReadValue" version="opset6"> <data variable_id="past_key_values.23.keypresent.23.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.23.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3683" name="Constant_1189513" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3684" name="Gather_1189514" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3685" name="self.model.layers.23.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="5879596816" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3686" name="Convert_1230812" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3687" name="self.model.layers.23.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="5882742544" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3688" name="Convert_1230815" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3689" name="self.model.layers.23.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3690" name="self.model.layers.23.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="5882743568" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3691" name="self.model.layers.23.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3692" name="__module.model.layers.23.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3693" name="__module.model.layers.23.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4022,key_states.97"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3694" name="Constant_1187833" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3695" name="__module.model.layers.23.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4029"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3696" name="__module.model.layers.23.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3697" name="__module.model.layers.23.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4030,k.47"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3698" name="__module.model.layers.23.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4052"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3699" name="Constant_1110391" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3700" name="Constant_1110393" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3701" name="Constant_1110395" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3702" name="__module.model.layers.23.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4062,x2.95"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3703" name="Constant_1176067" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3704" name="__module.model.layers.23.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4063"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3705" name="Constant_1110288" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3706" name="Constant_1110332" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3707" name="Constant_1110334" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3708" name="__module.model.layers.23.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4057"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3709" name="__module.model.layers.23.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4065"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3710" name="__module.model.layers.23.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4066"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3711" name="__module.model.layers.23.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4067"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3712" name="__module.model.layers.23.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4077,4078,hidden_states.699,present.23.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3713" name="__module.model.layers.23.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4079,4080,4081"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3714" name="__module.model.layers.23.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4083,hidden_states.701"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3715" name="Constant_1187834" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3716" name="__module.model.layers.23.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4087,key_states.99"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3717" name="ReadValue_1190126" type="ReadValue" version="opset6"> <data variable_id="past_key_values.23.valuepresent.23.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.23.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3718" name="Constant_1189516" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3719" name="Gather_1189517" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3720" name="self.model.layers.23.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="5882745616" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3721" name="Convert_1230802" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3722" name="self.model.layers.23.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="5885891344" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3723" name="Convert_1230805" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3724" name="self.model.layers.23.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3725" name="self.model.layers.23.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="5885892368" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3726" name="self.model.layers.23.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3727" name="__module.model.layers.23.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3728" name="__module.model.layers.23.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4024,value_states.47"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3729" name="Constant_1187835" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3730" name="__module.model.layers.23.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4032"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3731" name="__module.model.layers.23.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3732" name="__module.model.layers.23.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4033"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3733" name="__module.model.layers.23.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4093,4094,hidden_states.703,present.23.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3734" name="__module.model.layers.23.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4095,4096,4097"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3735" name="__module.model.layers.23.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4099,hidden_states.705"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3736" name="Constant_1187836" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3737" name="__module.model.layers.23.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4103"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3738" name="__module.model.layers.23.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4109,attn_output.93"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3739" name="__module.model.layers.23.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3740" name="__module.model.layers.23.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4110"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3741" name="__module.model.layers.23.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4113"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="3742" name="self.model.layers.23.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="5885894416" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3743" name="Convert_1230012" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3744" name="self.model.layers.23.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="5895331600" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3745" name="Convert_1230015" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3746" name="self.model.layers.23.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3747" name="self.model.layers.23.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="5895334672" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3748" name="self.model.layers.23.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3749" name="__module.model.layers.23.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3750" name="__module.model.layers.23.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4115,4117,hidden_states.707"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3751" name="__module.model.layers.23/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4120,4122,4133,hidden_states.709,hidden_states.711"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3752" name="Constant_1176071" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="5895340816" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3753" name="Constant_1176070" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3754" name="Constant_1176068" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3755" name="__module.model.layers.23.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4123"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3756" name="Constant_1110994" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4124"> <dim>1</dim> </port> </output> </layer> <layer id="3757" name="__module.model.layers.23.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4125,variance.95"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3758" name="Constant_1176069" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3759" name="__module.model.layers.23.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4126"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3760" name="__module.model.layers.23.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3761" name="__module.model.layers.23.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4127"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3762" name="__module.model.layers.23.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4128,4129,hidden_states.713,hidden_states.715"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3763" name="__module.model.layers.23.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4130,4132"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3764" name="self.model.layers.23.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="5895353104" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3765" name="Convert_1229042" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3766" name="self.model.layers.23.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="5966131984" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3767" name="Convert_1229045" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3768" name="self.model.layers.23.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3769" name="self.model.layers.23.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="5966155024" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3770" name="self.model.layers.23.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3771" name="__module.model.layers.23.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3772" name="__module.model.layers.23.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4138,input.47"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3773" name="__module.model.layers.23.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="4139"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3774" name="self.model.layers.23.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="5966201104" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3775" name="Convert_1229032" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3776" name="self.model.layers.23.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="6036979984" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3777" name="Convert_1229035" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3778" name="self.model.layers.23.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3779" name="self.model.layers.23.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="6037003024" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3780" name="self.model.layers.23.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3781" name="__module.model.layers.23.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3782" name="__module.model.layers.23.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4141"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3783" name="__module.model.layers.23.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4142"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3784" name="self.model.layers.23.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="6037049104" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3785" name="Convert_1229052" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3786" name="self.model.layers.23.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6107827984" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3787" name="Convert_1229055" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3788" name="self.model.layers.23.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3789" name="self.model.layers.23.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6107831056" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3790" name="self.model.layers.23.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3791" name="__module.model.layers.23.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3792" name="__module.model.layers.23.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4144,hidden_states.717"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3793" name="__module.model.layers.23/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4145,4147,4155,4166,hidden_states.719,hidden_states.721"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3794" name="Constant_1176075" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="6107837200" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3795" name="Constant_1176074" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3796" name="Constant_1176072" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3797" name="__module.model.layers.24.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4156"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3798" name="Constant_1111068" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4157"> <dim>1</dim> </port> </output> </layer> <layer id="3799" name="__module.model.layers.24.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4158,variance.97"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3800" name="Constant_1176073" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3801" name="__module.model.layers.24.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4159"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3802" name="__module.model.layers.24.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3803" name="__module.model.layers.24.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4160"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3804" name="__module.model.layers.24.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4161,4162,hidden_states.723,hidden_states.725"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3805" name="__module.model.layers.24.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4163,4165,hidden_states.727"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3806" name="self.model.layers.24.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="6107849488" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3807" name="Convert_1230022" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3808" name="self.model.layers.24.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6117286672" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3809" name="Convert_1230025" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3810" name="self.model.layers.24.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3811" name="self.model.layers.24.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6117289744" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3812" name="self.model.layers.24.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3813" name="__module.model.layers.24.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3814" name="__module.model.layers.24.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4174,query_states.49"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3815" name="Constant_1187837" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3816" name="__module.model.layers.24.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4180"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3817" name="__module.model.layers.24.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3818" name="__module.model.layers.24.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4181,q.49"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3819" name="__module.model.layers.24.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4190"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3820" name="Constant_1111465" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3821" name="Constant_1111467" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3822" name="Constant_1111469" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3823" name="__module.model.layers.24.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4200,x2.97"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3824" name="Constant_1176076" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3825" name="__module.model.layers.24.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4201"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3826" name="Constant_1111362" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3827" name="Constant_1111406" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3828" name="Constant_1111408" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3829" name="__module.model.layers.24.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4195"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3830" name="__module.model.layers.24.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4203"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3831" name="__module.model.layers.24.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4204"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3832" name="__module.model.layers.24.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4205"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3833" name="ReadValue_1190128" type="ReadValue" version="opset6"> <data variable_id="past_key_values.24.keypresent.24.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.24.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3834" name="Constant_1189519" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3835" name="Gather_1189520" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3836" name="self.model.layers.24.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="6117295888" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3837" name="Convert_1230832" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3838" name="self.model.layers.24.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="6120441616" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3839" name="Convert_1230835" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3840" name="self.model.layers.24.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3841" name="self.model.layers.24.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="6120442640" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3842" name="self.model.layers.24.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3843" name="__module.model.layers.24.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3844" name="__module.model.layers.24.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4176,key_states.101"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3845" name="Constant_1187838" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3846" name="__module.model.layers.24.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4183"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3847" name="__module.model.layers.24.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3848" name="__module.model.layers.24.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4184,k.49"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3849" name="__module.model.layers.24.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4206"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3850" name="Constant_1111608" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3851" name="Constant_1111610" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3852" name="Constant_1111612" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3853" name="__module.model.layers.24.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4216,x2.99"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3854" name="Constant_1176077" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3855" name="__module.model.layers.24.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4217"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3856" name="Constant_1111505" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3857" name="Constant_1111549" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3858" name="Constant_1111551" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3859" name="__module.model.layers.24.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4211"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3860" name="__module.model.layers.24.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4219"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3861" name="__module.model.layers.24.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4220"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3862" name="__module.model.layers.24.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4221"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3863" name="__module.model.layers.24.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4231,4232,hidden_states.729,present.24.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3864" name="__module.model.layers.24.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4233,4234,4235"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3865" name="__module.model.layers.24.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4237,hidden_states.731"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3866" name="Constant_1187839" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3867" name="__module.model.layers.24.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4241,key_states.103"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3868" name="ReadValue_1190130" type="ReadValue" version="opset6"> <data variable_id="past_key_values.24.valuepresent.24.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.24.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3869" name="Constant_1189522" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3870" name="Gather_1189523" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3871" name="self.model.layers.24.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="6120444688" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3872" name="Convert_1230822" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3873" name="self.model.layers.24.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="6123590416" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3874" name="Convert_1230825" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3875" name="self.model.layers.24.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3876" name="self.model.layers.24.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="6123591440" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3877" name="self.model.layers.24.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3878" name="__module.model.layers.24.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3879" name="__module.model.layers.24.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4178,value_states.49"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3880" name="Constant_1187840" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3881" name="__module.model.layers.24.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4186"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3882" name="__module.model.layers.24.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3883" name="__module.model.layers.24.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4187"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3884" name="__module.model.layers.24.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4247,4248,hidden_states.733,present.24.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3885" name="__module.model.layers.24.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4249,4250,4251"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3886" name="__module.model.layers.24.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4253,hidden_states.735"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3887" name="Constant_1187841" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3888" name="__module.model.layers.24.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4257"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3889" name="__module.model.layers.24.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4263,attn_output.97"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3890" name="__module.model.layers.24.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3891" name="__module.model.layers.24.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4264"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3892" name="__module.model.layers.24.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4267"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="3893" name="self.model.layers.24.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="6123593488" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3894" name="Convert_1230032" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3895" name="self.model.layers.24.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6133030672" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3896" name="Convert_1230035" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3897" name="self.model.layers.24.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3898" name="self.model.layers.24.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6133033744" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3899" name="self.model.layers.24.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3900" name="__module.model.layers.24.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3901" name="__module.model.layers.24.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4269,4271,hidden_states.737"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3902" name="__module.model.layers.24/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4274,4276,4287,hidden_states.739,hidden_states.741"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3903" name="Constant_1176081" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="6133039888" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3904" name="Constant_1176080" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3905" name="Constant_1176078" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3906" name="__module.model.layers.24.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4277"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3907" name="Constant_1112211" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4278"> <dim>1</dim> </port> </output> </layer> <layer id="3908" name="__module.model.layers.24.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4279,variance.99"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3909" name="Constant_1176079" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3910" name="__module.model.layers.24.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4280"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3911" name="__module.model.layers.24.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3912" name="__module.model.layers.24.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4281"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3913" name="__module.model.layers.24.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4282,4283,hidden_states.743,hidden_states.745"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3914" name="__module.model.layers.24.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4284,4286"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3915" name="self.model.layers.24.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="6133052176" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3916" name="Convert_1229072" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3917" name="self.model.layers.24.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="6203831056" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3918" name="Convert_1229075" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3919" name="self.model.layers.24.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3920" name="self.model.layers.24.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="6203854096" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3921" name="self.model.layers.24.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3922" name="__module.model.layers.24.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3923" name="__module.model.layers.24.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4292,input.49"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3924" name="__module.model.layers.24.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="4293"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3925" name="self.model.layers.24.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="6203900176" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3926" name="Convert_1229062" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3927" name="self.model.layers.24.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="6274679056" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3928" name="Convert_1229065" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3929" name="self.model.layers.24.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3930" name="self.model.layers.24.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="6274702096" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="3931" name="self.model.layers.24.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3932" name="__module.model.layers.24.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3933" name="__module.model.layers.24.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4295"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3934" name="__module.model.layers.24.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4296"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3935" name="self.model.layers.24.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="6274748176" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3936" name="Convert_1229082" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3937" name="self.model.layers.24.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6345527056" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3938" name="Convert_1229085" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3939" name="self.model.layers.24.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3940" name="self.model.layers.24.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6345530128" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3941" name="self.model.layers.24.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3942" name="__module.model.layers.24.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="3943" name="__module.model.layers.24.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4298,hidden_states.747"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3944" name="__module.model.layers.24/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4299,4301,4309,4320,hidden_states.749,hidden_states.751"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3945" name="Constant_1176085" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="6345536272" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3946" name="Constant_1176084" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3947" name="Constant_1176082" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3948" name="__module.model.layers.25.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4310"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3949" name="Constant_1112285" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4311"> <dim>1</dim> </port> </output> </layer> <layer id="3950" name="__module.model.layers.25.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4312,variance.101"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3951" name="Constant_1176083" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3952" name="__module.model.layers.25.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4313"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3953" name="__module.model.layers.25.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3954" name="__module.model.layers.25.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4314"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3955" name="__module.model.layers.25.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4315,4316,hidden_states.753,hidden_states.755"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3956" name="__module.model.layers.25.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4317,4319,hidden_states.757"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3957" name="self.model.layers.25.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="6345548560" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3958" name="Convert_1230042" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3959" name="self.model.layers.25.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6354985744" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3960" name="Convert_1230045" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3961" name="self.model.layers.25.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3962" name="self.model.layers.25.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6354988816" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="3963" name="self.model.layers.25.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3964" name="__module.model.layers.25.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3965" name="__module.model.layers.25.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4328,query_states.51"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3966" name="Constant_1187842" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3967" name="__module.model.layers.25.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4334"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="3968" name="__module.model.layers.25.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3969" name="__module.model.layers.25.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4335,q.51"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3970" name="__module.model.layers.25.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4344"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3971" name="Constant_1112682" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3972" name="Constant_1112684" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3973" name="Constant_1112686" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3974" name="__module.model.layers.25.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4354,x2.101"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3975" name="Constant_1176086" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3976" name="__module.model.layers.25.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4355"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3977" name="Constant_1112579" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3978" name="Constant_1112623" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3979" name="Constant_1112625" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3980" name="__module.model.layers.25.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4349"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="3981" name="__module.model.layers.25.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4357"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3982" name="__module.model.layers.25.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4358"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3983" name="__module.model.layers.25.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4359"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3984" name="ReadValue_1190132" type="ReadValue" version="opset6"> <data variable_id="past_key_values.25.keypresent.25.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.25.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3985" name="Constant_1189525" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3986" name="Gather_1189526" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="3987" name="self.model.layers.25.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="6354994960" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3988" name="Convert_1230852" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3989" name="self.model.layers.25.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="6358140688" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3990" name="Convert_1230855" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3991" name="self.model.layers.25.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3992" name="self.model.layers.25.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="6358141712" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="3993" name="self.model.layers.25.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3994" name="__module.model.layers.25.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3995" name="__module.model.layers.25.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4330,key_states.105"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3996" name="Constant_1187843" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3997" name="__module.model.layers.25.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4337"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="3998" name="__module.model.layers.25.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3999" name="__module.model.layers.25.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4338,k.51"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4000" name="__module.model.layers.25.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4360"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4001" name="Constant_1112825" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4002" name="Constant_1112827" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4003" name="Constant_1112829" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4004" name="__module.model.layers.25.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4370,x2.103"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4005" name="Constant_1176087" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4006" name="__module.model.layers.25.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4371"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4007" name="Constant_1112722" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4008" name="Constant_1112766" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4009" name="Constant_1112768" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4010" name="__module.model.layers.25.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4365"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4011" name="__module.model.layers.25.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4373"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4012" name="__module.model.layers.25.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4374"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4013" name="__module.model.layers.25.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4375"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4014" name="__module.model.layers.25.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4385,4386,hidden_states.759,present.25.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4015" name="__module.model.layers.25.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4387,4388,4389"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4016" name="__module.model.layers.25.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4391,hidden_states.761"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4017" name="Constant_1187844" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4018" name="__module.model.layers.25.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4395,key_states.107"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4019" name="ReadValue_1190134" type="ReadValue" version="opset6"> <data variable_id="past_key_values.25.valuepresent.25.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.25.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4020" name="Constant_1189528" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4021" name="Gather_1189529" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4022" name="self.model.layers.25.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="6358143760" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4023" name="Convert_1230842" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4024" name="self.model.layers.25.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="6361289488" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4025" name="Convert_1230845" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4026" name="self.model.layers.25.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4027" name="self.model.layers.25.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="6361290512" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4028" name="self.model.layers.25.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4029" name="__module.model.layers.25.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4030" name="__module.model.layers.25.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4332,value_states.51"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4031" name="Constant_1187845" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4032" name="__module.model.layers.25.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4340"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4033" name="__module.model.layers.25.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4034" name="__module.model.layers.25.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4341"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4035" name="__module.model.layers.25.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4401,4402,hidden_states.763,present.25.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4036" name="__module.model.layers.25.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4403,4404,4405"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4037" name="__module.model.layers.25.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4407,hidden_states.765"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4038" name="Constant_1187846" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4039" name="__module.model.layers.25.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4411"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4040" name="__module.model.layers.25.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4417,attn_output.101"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4041" name="__module.model.layers.25.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4042" name="__module.model.layers.25.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4418"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4043" name="__module.model.layers.25.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4421"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="4044" name="self.model.layers.25.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="6361292560" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4045" name="Convert_1230052" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4046" name="self.model.layers.25.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6370729744" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4047" name="Convert_1230055" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4048" name="self.model.layers.25.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4049" name="self.model.layers.25.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6370732816" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4050" name="self.model.layers.25.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4051" name="__module.model.layers.25.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4052" name="__module.model.layers.25.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4423,4425,hidden_states.767"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4053" name="__module.model.layers.25/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4428,4430,4441,hidden_states.769,hidden_states.771"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4054" name="Constant_1176091" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="6370738960" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4055" name="Constant_1176090" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4056" name="Constant_1176088" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4057" name="__module.model.layers.25.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4431"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4058" name="Constant_1113428" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4432"> <dim>1</dim> </port> </output> </layer> <layer id="4059" name="__module.model.layers.25.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4433,variance.103"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4060" name="Constant_1176089" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4061" name="__module.model.layers.25.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4434"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4062" name="__module.model.layers.25.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4063" name="__module.model.layers.25.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4435"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4064" name="__module.model.layers.25.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4436,4437,hidden_states.773,hidden_states.775"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4065" name="__module.model.layers.25.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4438,4440"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4066" name="self.model.layers.25.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="6370751248" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4067" name="Convert_1229102" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4068" name="self.model.layers.25.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="6441530128" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4069" name="Convert_1229105" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4070" name="self.model.layers.25.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4071" name="self.model.layers.25.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="6441553168" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4072" name="self.model.layers.25.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4073" name="__module.model.layers.25.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4074" name="__module.model.layers.25.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4446,input.51"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4075" name="__module.model.layers.25.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="4447"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4076" name="self.model.layers.25.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="6441599248" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4077" name="Convert_1229092" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4078" name="self.model.layers.25.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="6512378128" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4079" name="Convert_1229095" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4080" name="self.model.layers.25.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4081" name="self.model.layers.25.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="6512401168" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4082" name="self.model.layers.25.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4083" name="__module.model.layers.25.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4084" name="__module.model.layers.25.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4449"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4085" name="__module.model.layers.25.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4450"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4086" name="self.model.layers.25.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="6512447248" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4087" name="Convert_1229112" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4088" name="self.model.layers.25.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6583226128" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4089" name="Convert_1229115" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4090" name="self.model.layers.25.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4091" name="self.model.layers.25.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6583229200" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4092" name="self.model.layers.25.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4093" name="__module.model.layers.25.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4094" name="__module.model.layers.25.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4452,hidden_states.777"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4095" name="__module.model.layers.25/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4453,4455,4463,4474,hidden_states.779,hidden_states.781"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4096" name="Constant_1176095" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="6583235344" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4097" name="Constant_1176094" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4098" name="Constant_1176092" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4099" name="__module.model.layers.26.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4464"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4100" name="Constant_1113502" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4465"> <dim>1</dim> </port> </output> </layer> <layer id="4101" name="__module.model.layers.26.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4466,variance.105"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4102" name="Constant_1176093" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4103" name="__module.model.layers.26.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4467"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4104" name="__module.model.layers.26.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4105" name="__module.model.layers.26.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4468"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4106" name="__module.model.layers.26.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4469,4470,hidden_states.783,hidden_states.785"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4107" name="__module.model.layers.26.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4471,4473,hidden_states.787"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4108" name="self.model.layers.26.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="6583247632" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4109" name="Convert_1230062" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4110" name="self.model.layers.26.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6592684816" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4111" name="Convert_1230065" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4112" name="self.model.layers.26.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4113" name="self.model.layers.26.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6592687888" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4114" name="self.model.layers.26.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4115" name="__module.model.layers.26.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4116" name="__module.model.layers.26.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4482,query_states.53"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4117" name="Constant_1187847" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4118" name="__module.model.layers.26.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4488"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4119" name="__module.model.layers.26.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4120" name="__module.model.layers.26.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4489,q.53"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4121" name="__module.model.layers.26.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4498"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4122" name="Constant_1113899" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4123" name="Constant_1113901" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4124" name="Constant_1113903" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4125" name="__module.model.layers.26.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4508,x2.105"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4126" name="Constant_1176096" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4127" name="__module.model.layers.26.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4509"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4128" name="Constant_1113796" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4129" name="Constant_1113840" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4130" name="Constant_1113842" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4131" name="__module.model.layers.26.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4503"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4132" name="__module.model.layers.26.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4511"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4133" name="__module.model.layers.26.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4512"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4134" name="__module.model.layers.26.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4513"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4135" name="ReadValue_1190136" type="ReadValue" version="opset6"> <data variable_id="past_key_values.26.keypresent.26.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.26.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4136" name="Constant_1189531" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4137" name="Gather_1189532" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4138" name="self.model.layers.26.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="6592694032" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4139" name="Convert_1230872" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4140" name="self.model.layers.26.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="6595839760" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4141" name="Convert_1230875" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4142" name="self.model.layers.26.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4143" name="self.model.layers.26.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="6595840784" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4144" name="self.model.layers.26.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4145" name="__module.model.layers.26.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4146" name="__module.model.layers.26.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4484,key_states.109"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4147" name="Constant_1187848" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4148" name="__module.model.layers.26.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4491"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4149" name="__module.model.layers.26.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4150" name="__module.model.layers.26.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4492,k.53"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4151" name="__module.model.layers.26.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4514"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4152" name="Constant_1114042" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4153" name="Constant_1114044" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4154" name="Constant_1114046" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4155" name="__module.model.layers.26.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4524,x2.107"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4156" name="Constant_1176097" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4157" name="__module.model.layers.26.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4525"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4158" name="Constant_1113939" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4159" name="Constant_1113983" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4160" name="Constant_1113985" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4161" name="__module.model.layers.26.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4519"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4162" name="__module.model.layers.26.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4527"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4163" name="__module.model.layers.26.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4528"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4164" name="__module.model.layers.26.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4529"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4165" name="__module.model.layers.26.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4539,4540,hidden_states.789,present.26.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4166" name="__module.model.layers.26.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4541,4542,4543"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4167" name="__module.model.layers.26.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4545,hidden_states.791"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4168" name="Constant_1187849" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4169" name="__module.model.layers.26.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4549,key_states.111"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4170" name="ReadValue_1190138" type="ReadValue" version="opset6"> <data variable_id="past_key_values.26.valuepresent.26.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.26.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4171" name="Constant_1189534" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4172" name="Gather_1189535" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4173" name="self.model.layers.26.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="6595842832" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4174" name="Convert_1230862" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4175" name="self.model.layers.26.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="6598988560" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4176" name="Convert_1230865" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4177" name="self.model.layers.26.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4178" name="self.model.layers.26.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="6598989584" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4179" name="self.model.layers.26.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4180" name="__module.model.layers.26.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4181" name="__module.model.layers.26.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4486,value_states.53"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4182" name="Constant_1187850" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4183" name="__module.model.layers.26.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4494"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4184" name="__module.model.layers.26.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4185" name="__module.model.layers.26.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4495"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4186" name="__module.model.layers.26.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4555,4556,hidden_states.793,present.26.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4187" name="__module.model.layers.26.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4557,4558,4559"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4188" name="__module.model.layers.26.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4561,hidden_states.795"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4189" name="Constant_1187851" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4190" name="__module.model.layers.26.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4565"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4191" name="__module.model.layers.26.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4571,attn_output.105"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4192" name="__module.model.layers.26.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4193" name="__module.model.layers.26.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4572"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4194" name="__module.model.layers.26.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4575"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="4195" name="self.model.layers.26.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="6598991632" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4196" name="Convert_1230072" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4197" name="self.model.layers.26.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6608428816" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4198" name="Convert_1230075" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4199" name="self.model.layers.26.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4200" name="self.model.layers.26.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6608431888" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4201" name="self.model.layers.26.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4202" name="__module.model.layers.26.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4203" name="__module.model.layers.26.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4577,4579,hidden_states.797"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4204" name="__module.model.layers.26/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4582,4584,4595,hidden_states.799,hidden_states.801"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4205" name="Constant_1176101" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="6608438032" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4206" name="Constant_1176100" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4207" name="Constant_1176098" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4208" name="__module.model.layers.26.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4585"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4209" name="Constant_1114645" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4586"> <dim>1</dim> </port> </output> </layer> <layer id="4210" name="__module.model.layers.26.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4587,variance.107"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4211" name="Constant_1176099" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4212" name="__module.model.layers.26.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4588"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4213" name="__module.model.layers.26.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4214" name="__module.model.layers.26.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4589"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4215" name="__module.model.layers.26.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4590,4591,hidden_states.803,hidden_states.805"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4216" name="__module.model.layers.26.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4592,4594"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4217" name="self.model.layers.26.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="6608450320" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4218" name="Convert_1229132" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4219" name="self.model.layers.26.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="6679229200" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4220" name="Convert_1229135" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4221" name="self.model.layers.26.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4222" name="self.model.layers.26.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="6679252240" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4223" name="self.model.layers.26.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4224" name="__module.model.layers.26.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4225" name="__module.model.layers.26.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4600,input.53"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4226" name="__module.model.layers.26.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="4601"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4227" name="self.model.layers.26.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="6679298320" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4228" name="Convert_1229122" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4229" name="self.model.layers.26.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="6750077200" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4230" name="Convert_1229125" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4231" name="self.model.layers.26.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4232" name="self.model.layers.26.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="6750100240" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4233" name="self.model.layers.26.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4234" name="__module.model.layers.26.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4235" name="__module.model.layers.26.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4603"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4236" name="__module.model.layers.26.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4604"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4237" name="self.model.layers.26.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="6750146320" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4238" name="Convert_1229142" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4239" name="self.model.layers.26.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6820925200" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4240" name="Convert_1229145" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4241" name="self.model.layers.26.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4242" name="self.model.layers.26.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6820928272" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4243" name="self.model.layers.26.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4244" name="__module.model.layers.26.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4245" name="__module.model.layers.26.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4606,hidden_states.807"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4246" name="__module.model.layers.26/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4607,4609,4617,4628,hidden_states.809,hidden_states.811"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4247" name="Constant_1176105" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="6820934416" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4248" name="Constant_1176104" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4249" name="Constant_1176102" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4250" name="__module.model.layers.27.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4618"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4251" name="Constant_1114719" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4619"> <dim>1</dim> </port> </output> </layer> <layer id="4252" name="__module.model.layers.27.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4620,variance.109"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4253" name="Constant_1176103" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4254" name="__module.model.layers.27.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4621"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4255" name="__module.model.layers.27.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4256" name="__module.model.layers.27.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4622"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4257" name="__module.model.layers.27.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4623,4624,hidden_states.813,hidden_states.815"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4258" name="__module.model.layers.27.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4625,4627,hidden_states.817"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4259" name="self.model.layers.27.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="6820946704" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4260" name="Convert_1230082" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4261" name="self.model.layers.27.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6830383888" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4262" name="Convert_1230085" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4263" name="self.model.layers.27.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4264" name="self.model.layers.27.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6830386960" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4265" name="self.model.layers.27.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4266" name="__module.model.layers.27.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4267" name="__module.model.layers.27.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4636,query_states.55"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4268" name="Constant_1187852" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4269" name="__module.model.layers.27.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4642"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4270" name="__module.model.layers.27.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4271" name="__module.model.layers.27.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4643,q.55"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4272" name="__module.model.layers.27.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4652"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4273" name="Constant_1115116" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4274" name="Constant_1115118" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4275" name="Constant_1115120" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4276" name="__module.model.layers.27.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4662,x2.109"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4277" name="Constant_1176106" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4278" name="__module.model.layers.27.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4663"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4279" name="Constant_1115013" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4280" name="Constant_1115057" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4281" name="Constant_1115059" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4282" name="__module.model.layers.27.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4657"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4283" name="__module.model.layers.27.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4665"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4284" name="__module.model.layers.27.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4666"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4285" name="__module.model.layers.27.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4667"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4286" name="ReadValue_1190140" type="ReadValue" version="opset6"> <data variable_id="past_key_values.27.keypresent.27.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.27.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4287" name="Constant_1189537" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4288" name="Gather_1189538" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4289" name="self.model.layers.27.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="6830393104" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4290" name="Convert_1230892" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4291" name="self.model.layers.27.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="6833538832" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4292" name="Convert_1230895" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4293" name="self.model.layers.27.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4294" name="self.model.layers.27.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="6833539856" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4295" name="self.model.layers.27.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4296" name="__module.model.layers.27.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4297" name="__module.model.layers.27.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4638,key_states.113"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4298" name="Constant_1187853" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4299" name="__module.model.layers.27.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4645"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4300" name="__module.model.layers.27.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4301" name="__module.model.layers.27.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4646,k.55"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4302" name="__module.model.layers.27.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4668"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4303" name="Constant_1115259" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4304" name="Constant_1115261" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4305" name="Constant_1115263" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4306" name="__module.model.layers.27.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4678,x2.111"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4307" name="Constant_1176107" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4308" name="__module.model.layers.27.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4679"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4309" name="Constant_1115156" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4310" name="Constant_1115200" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4311" name="Constant_1115202" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4312" name="__module.model.layers.27.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4673"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4313" name="__module.model.layers.27.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4681"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4314" name="__module.model.layers.27.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4682"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4315" name="__module.model.layers.27.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4683"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4316" name="__module.model.layers.27.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4693,4694,hidden_states.819,present.27.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4317" name="__module.model.layers.27.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4695,4696,4697"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4318" name="__module.model.layers.27.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4699,hidden_states.821"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4319" name="Constant_1187854" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4320" name="__module.model.layers.27.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4703,key_states.115"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4321" name="ReadValue_1190142" type="ReadValue" version="opset6"> <data variable_id="past_key_values.27.valuepresent.27.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.27.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4322" name="Constant_1189540" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4323" name="Gather_1189541" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4324" name="self.model.layers.27.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="6833541904" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4325" name="Convert_1230882" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4326" name="self.model.layers.27.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="6836687632" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4327" name="Convert_1230885" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4328" name="self.model.layers.27.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4329" name="self.model.layers.27.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="6836688656" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4330" name="self.model.layers.27.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4331" name="__module.model.layers.27.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4332" name="__module.model.layers.27.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4640,value_states.55"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4333" name="Constant_1187855" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4334" name="__module.model.layers.27.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4648"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4335" name="__module.model.layers.27.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4336" name="__module.model.layers.27.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4649"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4337" name="__module.model.layers.27.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4709,4710,hidden_states.823,present.27.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4338" name="__module.model.layers.27.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4711,4712,4713"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4339" name="__module.model.layers.27.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4715,hidden_states.825"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4340" name="Constant_1187856" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4341" name="__module.model.layers.27.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4719"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4342" name="__module.model.layers.27.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4725,attn_output.109"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4343" name="__module.model.layers.27.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4344" name="__module.model.layers.27.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4726"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4345" name="__module.model.layers.27.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4729"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="4346" name="self.model.layers.27.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="6836690704" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4347" name="Convert_1230092" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4348" name="self.model.layers.27.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="6846127888" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4349" name="Convert_1230095" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4350" name="self.model.layers.27.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4351" name="self.model.layers.27.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="6846130960" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4352" name="self.model.layers.27.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4353" name="__module.model.layers.27.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4354" name="__module.model.layers.27.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4731,4733,hidden_states.827"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4355" name="__module.model.layers.27/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4736,4738,4749,hidden_states.829,hidden_states.831"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4356" name="Constant_1176111" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="6846137104" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4357" name="Constant_1176110" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4358" name="Constant_1176108" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4359" name="__module.model.layers.27.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4739"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4360" name="Constant_1115862" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4740"> <dim>1</dim> </port> </output> </layer> <layer id="4361" name="__module.model.layers.27.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4741,variance.111"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4362" name="Constant_1176109" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4363" name="__module.model.layers.27.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4742"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4364" name="__module.model.layers.27.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4365" name="__module.model.layers.27.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4743"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4366" name="__module.model.layers.27.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4744,4745,hidden_states.833,hidden_states.835"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4367" name="__module.model.layers.27.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4746,4748"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4368" name="self.model.layers.27.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="6846149392" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4369" name="Convert_1229162" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4370" name="self.model.layers.27.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="6916928272" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4371" name="Convert_1229165" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4372" name="self.model.layers.27.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4373" name="self.model.layers.27.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="6916951312" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4374" name="self.model.layers.27.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4375" name="__module.model.layers.27.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4376" name="__module.model.layers.27.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4754,input.55"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4377" name="__module.model.layers.27.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="4755"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4378" name="self.model.layers.27.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="6916997392" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4379" name="Convert_1229152" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4380" name="self.model.layers.27.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="6987776272" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4381" name="Convert_1229155" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4382" name="self.model.layers.27.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4383" name="self.model.layers.27.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="6987799312" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4384" name="self.model.layers.27.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4385" name="__module.model.layers.27.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4386" name="__module.model.layers.27.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4757"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4387" name="__module.model.layers.27.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4758"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4388" name="self.model.layers.27.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="6987845392" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4389" name="Convert_1229172" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4390" name="self.model.layers.27.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7058624272" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4391" name="Convert_1229175" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4392" name="self.model.layers.27.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4393" name="self.model.layers.27.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7058627344" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4394" name="self.model.layers.27.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4395" name="__module.model.layers.27.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4396" name="__module.model.layers.27.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4760,hidden_states.837"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4397" name="__module.model.layers.27/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4761,4763,4771,4782,hidden_states.839,hidden_states.841"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4398" name="Constant_1176115" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="7058633488" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4399" name="Constant_1176114" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4400" name="Constant_1176112" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4401" name="__module.model.layers.28.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4772"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4402" name="Constant_1115936" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4773"> <dim>1</dim> </port> </output> </layer> <layer id="4403" name="__module.model.layers.28.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4774,variance.113"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4404" name="Constant_1176113" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4405" name="__module.model.layers.28.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4775"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4406" name="__module.model.layers.28.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4407" name="__module.model.layers.28.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4776"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4408" name="__module.model.layers.28.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4777,4778,hidden_states.843,hidden_states.845"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4409" name="__module.model.layers.28.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4779,4781,hidden_states.847"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4410" name="self.model.layers.28.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="7058645776" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4411" name="Convert_1230102" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4412" name="self.model.layers.28.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7068082960" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4413" name="Convert_1230105" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4414" name="self.model.layers.28.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4415" name="self.model.layers.28.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7068086032" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4416" name="self.model.layers.28.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4417" name="__module.model.layers.28.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4418" name="__module.model.layers.28.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4790,query_states.57"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4419" name="Constant_1187857" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4420" name="__module.model.layers.28.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4796"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4421" name="__module.model.layers.28.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4422" name="__module.model.layers.28.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4797,q.57"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4423" name="__module.model.layers.28.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4806"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4424" name="Constant_1116333" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4425" name="Constant_1116335" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4426" name="Constant_1116337" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4427" name="__module.model.layers.28.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4816,x2.113"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4428" name="Constant_1176116" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4429" name="__module.model.layers.28.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4817"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4430" name="Constant_1116230" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4431" name="Constant_1116274" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4432" name="Constant_1116276" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4433" name="__module.model.layers.28.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4811"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4434" name="__module.model.layers.28.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4819"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4435" name="__module.model.layers.28.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4820"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4436" name="__module.model.layers.28.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4821"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4437" name="ReadValue_1190144" type="ReadValue" version="opset6"> <data variable_id="past_key_values.28.keypresent.28.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.28.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4438" name="Constant_1189543" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4439" name="Gather_1189544" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4440" name="self.model.layers.28.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="7068092176" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4441" name="Convert_1230912" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4442" name="self.model.layers.28.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="7071237904" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4443" name="Convert_1230915" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4444" name="self.model.layers.28.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4445" name="self.model.layers.28.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="7071238928" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4446" name="self.model.layers.28.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4447" name="__module.model.layers.28.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4448" name="__module.model.layers.28.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4792,key_states.117"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4449" name="Constant_1187858" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4450" name="__module.model.layers.28.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4799"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4451" name="__module.model.layers.28.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4452" name="__module.model.layers.28.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4800,k.57"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4453" name="__module.model.layers.28.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4822"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4454" name="Constant_1116476" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4455" name="Constant_1116478" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4456" name="Constant_1116480" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4457" name="__module.model.layers.28.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4832,x2.115"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4458" name="Constant_1176117" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4459" name="__module.model.layers.28.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4833"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4460" name="Constant_1116373" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4461" name="Constant_1116417" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4462" name="Constant_1116419" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4463" name="__module.model.layers.28.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4827"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4464" name="__module.model.layers.28.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4835"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4465" name="__module.model.layers.28.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4836"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4466" name="__module.model.layers.28.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4837"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4467" name="__module.model.layers.28.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4847,4848,hidden_states.849,present.28.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4468" name="__module.model.layers.28.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4849,4850,4851"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4469" name="__module.model.layers.28.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4853,hidden_states.851"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4470" name="Constant_1187859" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4471" name="__module.model.layers.28.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4857,key_states.119"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4472" name="ReadValue_1190146" type="ReadValue" version="opset6"> <data variable_id="past_key_values.28.valuepresent.28.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.28.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4473" name="Constant_1189546" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4474" name="Gather_1189547" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4475" name="self.model.layers.28.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="7071240976" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4476" name="Convert_1230902" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4477" name="self.model.layers.28.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="7074386704" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4478" name="Convert_1230905" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4479" name="self.model.layers.28.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4480" name="self.model.layers.28.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="7074387728" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4481" name="self.model.layers.28.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4482" name="__module.model.layers.28.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4483" name="__module.model.layers.28.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4794,value_states.57"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4484" name="Constant_1187860" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4485" name="__module.model.layers.28.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4802"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4486" name="__module.model.layers.28.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4487" name="__module.model.layers.28.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4803"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4488" name="__module.model.layers.28.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4863,4864,hidden_states.853,present.28.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4489" name="__module.model.layers.28.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="4865,4866,4867"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4490" name="__module.model.layers.28.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="4869,hidden_states.855"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4491" name="Constant_1187861" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4492" name="__module.model.layers.28.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4873"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4493" name="__module.model.layers.28.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4879,attn_output.113"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4494" name="__module.model.layers.28.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4495" name="__module.model.layers.28.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4880"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4496" name="__module.model.layers.28.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4883"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="4497" name="self.model.layers.28.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="7074389776" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4498" name="Convert_1230112" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4499" name="self.model.layers.28.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7083826960" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4500" name="Convert_1230115" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4501" name="self.model.layers.28.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4502" name="self.model.layers.28.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7083830032" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4503" name="self.model.layers.28.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4504" name="__module.model.layers.28.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4505" name="__module.model.layers.28.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4885,4887,hidden_states.857"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4506" name="__module.model.layers.28/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4890,4892,4903,hidden_states.859,hidden_states.861"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4507" name="Constant_1176121" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="7083836176" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4508" name="Constant_1176120" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4509" name="Constant_1176118" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4510" name="__module.model.layers.28.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4893"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4511" name="Constant_1117079" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4894"> <dim>1</dim> </port> </output> </layer> <layer id="4512" name="__module.model.layers.28.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4895,variance.115"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4513" name="Constant_1176119" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4514" name="__module.model.layers.28.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4896"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4515" name="__module.model.layers.28.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4516" name="__module.model.layers.28.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4897"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4517" name="__module.model.layers.28.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4898,4899,hidden_states.863,hidden_states.865"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4518" name="__module.model.layers.28.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4900,4902"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4519" name="self.model.layers.28.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="7083848464" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4520" name="Convert_1229192" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4521" name="self.model.layers.28.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="7154627344" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4522" name="Convert_1229195" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4523" name="self.model.layers.28.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4524" name="self.model.layers.28.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="7154650384" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4525" name="self.model.layers.28.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4526" name="__module.model.layers.28.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4527" name="__module.model.layers.28.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4908,input.57"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4528" name="__module.model.layers.28.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="4909"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4529" name="self.model.layers.28.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="7154696464" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4530" name="Convert_1229182" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4531" name="self.model.layers.28.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="7225475344" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4532" name="Convert_1229185" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4533" name="self.model.layers.28.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4534" name="self.model.layers.28.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="7225498384" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4535" name="self.model.layers.28.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4536" name="__module.model.layers.28.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4537" name="__module.model.layers.28.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4911"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4538" name="__module.model.layers.28.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4912"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4539" name="self.model.layers.28.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="7225544464" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4540" name="Convert_1229202" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4541" name="self.model.layers.28.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7296323344" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4542" name="Convert_1229205" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4543" name="self.model.layers.28.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4544" name="self.model.layers.28.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7296326416" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4545" name="self.model.layers.28.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4546" name="__module.model.layers.28.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4547" name="__module.model.layers.28.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="4914,hidden_states.867"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4548" name="__module.model.layers.28/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4915,4917,4925,4936,hidden_states.869,hidden_states.871"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4549" name="Constant_1176125" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="7296332560" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4550" name="Constant_1176124" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4551" name="Constant_1176122" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4552" name="__module.model.layers.29.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4926"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4553" name="Constant_1117153" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="4927"> <dim>1</dim> </port> </output> </layer> <layer id="4554" name="__module.model.layers.29.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4928,variance.117"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4555" name="Constant_1176123" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4556" name="__module.model.layers.29.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4929"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4557" name="__module.model.layers.29.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4558" name="__module.model.layers.29.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4930"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4559" name="__module.model.layers.29.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4931,4932,hidden_states.873,hidden_states.875"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4560" name="__module.model.layers.29.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4933,4935,hidden_states.877"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4561" name="self.model.layers.29.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="7296344848" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4562" name="Convert_1230122" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4563" name="self.model.layers.29.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7305782032" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4564" name="Convert_1230125" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4565" name="self.model.layers.29.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4566" name="self.model.layers.29.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7305785104" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4567" name="self.model.layers.29.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4568" name="__module.model.layers.29.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4569" name="__module.model.layers.29.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4944,query_states.59"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4570" name="Constant_1187862" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4571" name="__module.model.layers.29.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4950"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4572" name="__module.model.layers.29.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4573" name="__module.model.layers.29.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4951,q.59"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4574" name="__module.model.layers.29.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4960"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4575" name="Constant_1117550" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4576" name="Constant_1117552" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4577" name="Constant_1117554" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4578" name="__module.model.layers.29.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4970,x2.117"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4579" name="Constant_1176126" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4580" name="__module.model.layers.29.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4971"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4581" name="Constant_1117447" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4582" name="Constant_1117491" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4583" name="Constant_1117493" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4584" name="__module.model.layers.29.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4965"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4585" name="__module.model.layers.29.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4973"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4586" name="__module.model.layers.29.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4974"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4587" name="__module.model.layers.29.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4975"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4588" name="ReadValue_1190148" type="ReadValue" version="opset6"> <data variable_id="past_key_values.29.keypresent.29.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.29.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4589" name="Constant_1189549" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4590" name="Gather_1189550" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4591" name="self.model.layers.29.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="7305791248" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4592" name="Convert_1230932" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4593" name="self.model.layers.29.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="7308936976" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4594" name="Convert_1230935" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4595" name="self.model.layers.29.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4596" name="self.model.layers.29.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="7308938000" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4597" name="self.model.layers.29.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4598" name="__module.model.layers.29.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4599" name="__module.model.layers.29.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4946,key_states.121"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4600" name="Constant_1187863" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4601" name="__module.model.layers.29.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4953"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4602" name="__module.model.layers.29.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4603" name="__module.model.layers.29.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4954,k.59"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4604" name="__module.model.layers.29.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4976"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4605" name="Constant_1117693" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4606" name="Constant_1117695" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4607" name="Constant_1117697" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4608" name="__module.model.layers.29.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4986,x2.119"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4609" name="Constant_1176127" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4610" name="__module.model.layers.29.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4987"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4611" name="Constant_1117590" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4612" name="Constant_1117634" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4613" name="Constant_1117636" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4614" name="__module.model.layers.29.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4981"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4615" name="__module.model.layers.29.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="4989"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4616" name="__module.model.layers.29.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4990"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4617" name="__module.model.layers.29.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="4991"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4618" name="__module.model.layers.29.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5001,5002,hidden_states.879,present.29.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4619" name="__module.model.layers.29.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5003,5004,5005"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4620" name="__module.model.layers.29.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5007,hidden_states.881"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4621" name="Constant_1187864" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4622" name="__module.model.layers.29.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5011,key_states.123"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4623" name="ReadValue_1190150" type="ReadValue" version="opset6"> <data variable_id="past_key_values.29.valuepresent.29.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.29.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4624" name="Constant_1189552" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4625" name="Gather_1189553" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4626" name="self.model.layers.29.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="7308940048" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4627" name="Convert_1230922" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4628" name="self.model.layers.29.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="7312085776" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4629" name="Convert_1230925" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4630" name="self.model.layers.29.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4631" name="self.model.layers.29.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="7312086800" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4632" name="self.model.layers.29.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4633" name="__module.model.layers.29.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4634" name="__module.model.layers.29.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4948,value_states.59"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4635" name="Constant_1187865" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4636" name="__module.model.layers.29.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4956"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4637" name="__module.model.layers.29.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4638" name="__module.model.layers.29.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4957"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4639" name="__module.model.layers.29.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5017,5018,hidden_states.883,present.29.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4640" name="__module.model.layers.29.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5019,5020,5021"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4641" name="__module.model.layers.29.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5023,hidden_states.885"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4642" name="Constant_1187866" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4643" name="__module.model.layers.29.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5027"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4644" name="__module.model.layers.29.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="5033,attn_output.117"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4645" name="__module.model.layers.29.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4646" name="__module.model.layers.29.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5034"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4647" name="__module.model.layers.29.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="5037"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="4648" name="self.model.layers.29.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="7312088848" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4649" name="Convert_1230132" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4650" name="self.model.layers.29.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7321526032" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4651" name="Convert_1230135" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4652" name="self.model.layers.29.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4653" name="self.model.layers.29.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7321529104" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4654" name="self.model.layers.29.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4655" name="__module.model.layers.29.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4656" name="__module.model.layers.29.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5039,5041,hidden_states.887"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4657" name="__module.model.layers.29/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5044,5046,5057,hidden_states.889,hidden_states.891"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4658" name="Constant_1176131" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="7321535248" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4659" name="Constant_1176130" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4660" name="Constant_1176128" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4661" name="__module.model.layers.29.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5047"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4662" name="Constant_1118296" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5048"> <dim>1</dim> </port> </output> </layer> <layer id="4663" name="__module.model.layers.29.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5049,variance.119"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4664" name="Constant_1176129" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4665" name="__module.model.layers.29.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5050"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4666" name="__module.model.layers.29.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4667" name="__module.model.layers.29.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5051"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4668" name="__module.model.layers.29.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5052,5053,hidden_states.893,hidden_states.895"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4669" name="__module.model.layers.29.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5054,5056"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4670" name="self.model.layers.29.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="7321547536" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4671" name="Convert_1229222" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4672" name="self.model.layers.29.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="7392326416" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4673" name="Convert_1229225" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4674" name="self.model.layers.29.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4675" name="self.model.layers.29.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="7392349456" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4676" name="self.model.layers.29.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4677" name="__module.model.layers.29.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4678" name="__module.model.layers.29.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5062,input.59"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4679" name="__module.model.layers.29.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="5063"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4680" name="self.model.layers.29.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="7392395536" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4681" name="Convert_1229212" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4682" name="self.model.layers.29.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="7463174416" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4683" name="Convert_1229215" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4684" name="self.model.layers.29.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4685" name="self.model.layers.29.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="7463197456" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4686" name="self.model.layers.29.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4687" name="__module.model.layers.29.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4688" name="__module.model.layers.29.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5065"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4689" name="__module.model.layers.29.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5066"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4690" name="self.model.layers.29.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="7463243536" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4691" name="Convert_1229232" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4692" name="self.model.layers.29.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7534022416" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4693" name="Convert_1229235" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4694" name="self.model.layers.29.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4695" name="self.model.layers.29.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7534025488" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4696" name="self.model.layers.29.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4697" name="__module.model.layers.29.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4698" name="__module.model.layers.29.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5068,hidden_states.897"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4699" name="__module.model.layers.29/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5069,5071,5079,5090,hidden_states.899,hidden_states.901"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4700" name="Constant_1176135" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="7534031632" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4701" name="Constant_1176134" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4702" name="Constant_1176132" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4703" name="__module.model.layers.30.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5080"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4704" name="Constant_1118370" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5081"> <dim>1</dim> </port> </output> </layer> <layer id="4705" name="__module.model.layers.30.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5082,variance.121"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4706" name="Constant_1176133" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4707" name="__module.model.layers.30.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5083"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4708" name="__module.model.layers.30.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4709" name="__module.model.layers.30.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5084"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4710" name="__module.model.layers.30.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5085,5086,hidden_states.903,hidden_states.905"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4711" name="__module.model.layers.30.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5087,5089,hidden_states.907"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4712" name="self.model.layers.30.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="7534043920" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4713" name="Convert_1230142" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4714" name="self.model.layers.30.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7543481104" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4715" name="Convert_1230145" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4716" name="self.model.layers.30.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4717" name="self.model.layers.30.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7543484176" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4718" name="self.model.layers.30.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4719" name="__module.model.layers.30.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4720" name="__module.model.layers.30.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5098,query_states.61"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4721" name="Constant_1187867" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4722" name="__module.model.layers.30.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5104"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4723" name="__module.model.layers.30.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4724" name="__module.model.layers.30.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5105,q.61"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4725" name="__module.model.layers.30.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5114"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4726" name="Constant_1118767" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4727" name="Constant_1118769" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4728" name="Constant_1118771" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4729" name="__module.model.layers.30.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5124,x2.121"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4730" name="Constant_1176136" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4731" name="__module.model.layers.30.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5125"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4732" name="Constant_1118664" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4733" name="Constant_1118708" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4734" name="Constant_1118710" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4735" name="__module.model.layers.30.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5119"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4736" name="__module.model.layers.30.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5127"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4737" name="__module.model.layers.30.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5128"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4738" name="__module.model.layers.30.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5129"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4739" name="ReadValue_1190156" type="ReadValue" version="opset6"> <data variable_id="past_key_values.30.keypresent.30.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.30.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4740" name="Constant_1189555" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4741" name="Gather_1189556" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4742" name="self.model.layers.30.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="7543490320" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4743" name="Convert_1230952" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4744" name="self.model.layers.30.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="7546636048" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4745" name="Convert_1230955" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4746" name="self.model.layers.30.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4747" name="self.model.layers.30.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="7546637072" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4748" name="self.model.layers.30.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4749" name="__module.model.layers.30.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4750" name="__module.model.layers.30.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5100,key_states.125"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4751" name="Constant_1187868" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4752" name="__module.model.layers.30.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5107"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4753" name="__module.model.layers.30.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4754" name="__module.model.layers.30.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5108,k.61"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4755" name="__module.model.layers.30.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5130"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4756" name="Constant_1118910" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4757" name="Constant_1118912" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4758" name="Constant_1118914" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4759" name="__module.model.layers.30.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5140,x2.123"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4760" name="Constant_1176137" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4761" name="__module.model.layers.30.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5141"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4762" name="Constant_1118807" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4763" name="Constant_1118851" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4764" name="Constant_1118853" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4765" name="__module.model.layers.30.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5135"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4766" name="__module.model.layers.30.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5143"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4767" name="__module.model.layers.30.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5144"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4768" name="__module.model.layers.30.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5145"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4769" name="__module.model.layers.30.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5155,5156,hidden_states.909,present.30.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4770" name="__module.model.layers.30.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5157,5158,5159"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4771" name="__module.model.layers.30.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5161,hidden_states.911"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4772" name="Constant_1187869" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4773" name="__module.model.layers.30.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5165,key_states.127"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4774" name="ReadValue_1190158" type="ReadValue" version="opset6"> <data variable_id="past_key_values.30.valuepresent.30.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.30.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4775" name="Constant_1189558" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4776" name="Gather_1189559" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4777" name="self.model.layers.30.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="7546639120" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4778" name="Convert_1230942" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4779" name="self.model.layers.30.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="7549784848" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4780" name="Convert_1230945" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4781" name="self.model.layers.30.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4782" name="self.model.layers.30.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="7549785872" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4783" name="self.model.layers.30.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4784" name="__module.model.layers.30.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4785" name="__module.model.layers.30.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5102,value_states.61"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4786" name="Constant_1187870" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4787" name="__module.model.layers.30.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5110"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4788" name="__module.model.layers.30.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4789" name="__module.model.layers.30.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5111"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4790" name="__module.model.layers.30.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5171,5172,hidden_states.913,present.30.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4791" name="__module.model.layers.30.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5173,5174,5175"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4792" name="__module.model.layers.30.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5177,hidden_states.915"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4793" name="Constant_1187871" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4794" name="__module.model.layers.30.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5181"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4795" name="__module.model.layers.30.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="5187,attn_output.121"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4796" name="__module.model.layers.30.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4797" name="__module.model.layers.30.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5188"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4798" name="__module.model.layers.30.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="5191"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="4799" name="self.model.layers.30.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="7549787920" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4800" name="Convert_1230152" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4801" name="self.model.layers.30.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7559225104" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4802" name="Convert_1230155" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4803" name="self.model.layers.30.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4804" name="self.model.layers.30.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7559228176" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4805" name="self.model.layers.30.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4806" name="__module.model.layers.30.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4807" name="__module.model.layers.30.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5193,5195,hidden_states.917"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4808" name="__module.model.layers.30/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5198,5200,5211,hidden_states.919,hidden_states.921"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4809" name="Constant_1176141" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="7559234320" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4810" name="Constant_1176140" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4811" name="Constant_1176138" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4812" name="__module.model.layers.30.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5201"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4813" name="Constant_1119513" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5202"> <dim>1</dim> </port> </output> </layer> <layer id="4814" name="__module.model.layers.30.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5203,variance.123"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4815" name="Constant_1176139" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4816" name="__module.model.layers.30.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5204"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4817" name="__module.model.layers.30.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4818" name="__module.model.layers.30.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5205"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4819" name="__module.model.layers.30.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5206,5207,hidden_states.923,hidden_states.925"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4820" name="__module.model.layers.30.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5208,5210"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4821" name="self.model.layers.30.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="7559246608" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4822" name="Convert_1229252" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4823" name="self.model.layers.30.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="7630025488" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4824" name="Convert_1229255" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4825" name="self.model.layers.30.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4826" name="self.model.layers.30.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="7630048528" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4827" name="self.model.layers.30.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4828" name="__module.model.layers.30.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4829" name="__module.model.layers.30.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5216,input.61"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4830" name="__module.model.layers.30.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="5217"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4831" name="self.model.layers.30.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="7630094608" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4832" name="Convert_1229242" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4833" name="self.model.layers.30.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="7700873488" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4834" name="Convert_1229245" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4835" name="self.model.layers.30.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4836" name="self.model.layers.30.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="7700896528" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4837" name="self.model.layers.30.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4838" name="__module.model.layers.30.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4839" name="__module.model.layers.30.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5219"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4840" name="__module.model.layers.30.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5220"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4841" name="self.model.layers.30.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="7700942608" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4842" name="Convert_1229262" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4843" name="self.model.layers.30.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7771721488" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4844" name="Convert_1229265" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4845" name="self.model.layers.30.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4846" name="self.model.layers.30.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7771724560" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4847" name="self.model.layers.30.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4848" name="__module.model.layers.30.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4849" name="__module.model.layers.30.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5222,hidden_states.927"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4850" name="__module.model.layers.30/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5223,5225,5233,5244,hidden_states.929,hidden_states.931"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4851" name="Constant_1176145" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="7771730704" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4852" name="Constant_1176144" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4853" name="Constant_1176142" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4854" name="__module.model.layers.31.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5234"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4855" name="Constant_1119587" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5235"> <dim>1</dim> </port> </output> </layer> <layer id="4856" name="__module.model.layers.31.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5236,variance.125"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4857" name="Constant_1176143" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4858" name="__module.model.layers.31.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5237"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4859" name="__module.model.layers.31.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4860" name="__module.model.layers.31.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5238"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4861" name="__module.model.layers.31.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5239,5240,hidden_states.933,hidden_states.935"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4862" name="__module.model.layers.31.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5241,5243,hidden_states.937"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4863" name="self.model.layers.31.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="7771742992" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4864" name="Convert_1230162" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4865" name="self.model.layers.31.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7781180176" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4866" name="Convert_1230165" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4867" name="self.model.layers.31.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4868" name="self.model.layers.31.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7781183248" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4869" name="self.model.layers.31.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4870" name="__module.model.layers.31.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4871" name="__module.model.layers.31.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5252,query_states.63"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4872" name="Constant_1187872" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4873" name="__module.model.layers.31.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5258"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4874" name="__module.model.layers.31.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4875" name="__module.model.layers.31.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5259,q.63"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4876" name="__module.model.layers.31.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5268"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4877" name="Constant_1119984" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4878" name="Constant_1119986" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4879" name="Constant_1119988" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4880" name="__module.model.layers.31.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5278,x2.125"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4881" name="Constant_1176146" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4882" name="__module.model.layers.31.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5279"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4883" name="Constant_1119881" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4884" name="Constant_1119925" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4885" name="Constant_1119927" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4886" name="__module.model.layers.31.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5273"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4887" name="__module.model.layers.31.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5281"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4888" name="__module.model.layers.31.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5282"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4889" name="__module.model.layers.31.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5283"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4890" name="ReadValue_1190160" type="ReadValue" version="opset6"> <data variable_id="past_key_values.31.keypresent.31.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.31.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4891" name="Constant_1189561" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4892" name="Gather_1189562" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4893" name="self.model.layers.31.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="7781189392" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4894" name="Convert_1230972" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4895" name="self.model.layers.31.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="7784335120" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4896" name="Convert_1230975" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4897" name="self.model.layers.31.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4898" name="self.model.layers.31.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="7784336144" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4899" name="self.model.layers.31.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4900" name="__module.model.layers.31.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4901" name="__module.model.layers.31.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5254,key_states.129"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4902" name="Constant_1187873" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4903" name="__module.model.layers.31.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5261"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4904" name="__module.model.layers.31.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4905" name="__module.model.layers.31.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5262,k.63"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4906" name="__module.model.layers.31.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5284"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4907" name="Constant_1120127" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4908" name="Constant_1120129" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4909" name="Constant_1120131" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4910" name="__module.model.layers.31.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5294,x2.127"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4911" name="Constant_1176147" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4912" name="__module.model.layers.31.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5295"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4913" name="Constant_1120024" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4914" name="Constant_1120068" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4915" name="Constant_1120070" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4916" name="__module.model.layers.31.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5289"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="4917" name="__module.model.layers.31.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5297"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4918" name="__module.model.layers.31.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5298"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4919" name="__module.model.layers.31.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5299"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4920" name="__module.model.layers.31.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5309,5310,hidden_states.939,present.31.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4921" name="__module.model.layers.31.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5311,5312,5313"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4922" name="__module.model.layers.31.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5315,hidden_states.941"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4923" name="Constant_1187874" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4924" name="__module.model.layers.31.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5319,key_states.131"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4925" name="ReadValue_1190162" type="ReadValue" version="opset6"> <data variable_id="past_key_values.31.valuepresent.31.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.31.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4926" name="Constant_1189564" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4927" name="Gather_1189565" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4928" name="self.model.layers.31.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="7784338192" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4929" name="Convert_1230962" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4930" name="self.model.layers.31.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="7787483920" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4931" name="Convert_1230965" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4932" name="self.model.layers.31.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4933" name="self.model.layers.31.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="7787484944" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="4934" name="self.model.layers.31.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4935" name="__module.model.layers.31.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4936" name="__module.model.layers.31.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5256,value_states.63"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4937" name="Constant_1187875" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4938" name="__module.model.layers.31.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5264"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="4939" name="__module.model.layers.31.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4940" name="__module.model.layers.31.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5265"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4941" name="__module.model.layers.31.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5325,5326,hidden_states.943,present.31.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4942" name="__module.model.layers.31.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5327,5328,5329"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4943" name="__module.model.layers.31.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5331,hidden_states.945"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4944" name="Constant_1187876" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4945" name="__module.model.layers.31.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5335"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4946" name="__module.model.layers.31.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="5341,attn_output.125"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="4947" name="__module.model.layers.31.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4948" name="__module.model.layers.31.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5342"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="4949" name="__module.model.layers.31.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="5345"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="4950" name="self.model.layers.31.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="7787486992" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4951" name="Convert_1230172" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4952" name="self.model.layers.31.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="7796924176" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4953" name="Convert_1230175" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4954" name="self.model.layers.31.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4955" name="self.model.layers.31.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="7796927248" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4956" name="self.model.layers.31.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4957" name="__module.model.layers.31.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4958" name="__module.model.layers.31.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5347,5349,hidden_states.947"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4959" name="__module.model.layers.31/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5352,5354,5365,hidden_states.949,hidden_states.951"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4960" name="Constant_1176151" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="7796933392" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4961" name="Constant_1176150" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4962" name="Constant_1176148" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4963" name="__module.model.layers.31.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5355"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4964" name="Constant_1120730" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5356"> <dim>1</dim> </port> </output> </layer> <layer id="4965" name="__module.model.layers.31.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5357,variance.127"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4966" name="Constant_1176149" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4967" name="__module.model.layers.31.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5358"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4968" name="__module.model.layers.31.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4969" name="__module.model.layers.31.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5359"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4970" name="__module.model.layers.31.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5360,5361,hidden_states.953,hidden_states.955"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4971" name="__module.model.layers.31.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5362,5364"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4972" name="self.model.layers.31.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="7796945680" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4973" name="Convert_1229282" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4974" name="self.model.layers.31.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="7867724560" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4975" name="Convert_1229285" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4976" name="self.model.layers.31.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4977" name="self.model.layers.31.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="7867747600" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4978" name="self.model.layers.31.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4979" name="__module.model.layers.31.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4980" name="__module.model.layers.31.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5370,input.63"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4981" name="__module.model.layers.31.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="5371"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4982" name="self.model.layers.31.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="7867793680" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4983" name="Convert_1229272" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4984" name="self.model.layers.31.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="7938572560" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4985" name="Convert_1229275" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4986" name="self.model.layers.31.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4987" name="self.model.layers.31.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="7938595600" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="4988" name="self.model.layers.31.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4989" name="__module.model.layers.31.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4990" name="__module.model.layers.31.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5373"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4991" name="__module.model.layers.31.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5374"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4992" name="self.model.layers.31.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="7938641680" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4993" name="Convert_1229292" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4994" name="self.model.layers.31.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8009420560" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4995" name="Convert_1229295" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4996" name="self.model.layers.31.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4997" name="self.model.layers.31.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8009423632" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="4998" name="self.model.layers.31.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="4999" name="__module.model.layers.31.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5000" name="__module.model.layers.31.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5376,hidden_states.957"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5001" name="__module.model.layers.31/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5377,5379,5387,5398,hidden_states.959,hidden_states.961"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5002" name="Constant_1176155" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="8009429776" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5003" name="Constant_1176154" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5004" name="Constant_1176152" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5005" name="__module.model.layers.32.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5388"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5006" name="Constant_1120804" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5389"> <dim>1</dim> </port> </output> </layer> <layer id="5007" name="__module.model.layers.32.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5390,variance.129"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5008" name="Constant_1176153" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5009" name="__module.model.layers.32.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5391"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5010" name="__module.model.layers.32.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5011" name="__module.model.layers.32.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5392"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5012" name="__module.model.layers.32.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5393,5394,hidden_states.963,hidden_states.965"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5013" name="__module.model.layers.32.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5395,5397,hidden_states.967"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5014" name="self.model.layers.32.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="8009442064" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5015" name="Convert_1230182" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5016" name="self.model.layers.32.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8018879248" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5017" name="Convert_1230185" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5018" name="self.model.layers.32.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5019" name="self.model.layers.32.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8018882320" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5020" name="self.model.layers.32.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5021" name="__module.model.layers.32.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5022" name="__module.model.layers.32.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5406,query_states.65"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5023" name="Constant_1187877" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5024" name="__module.model.layers.32.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5412"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5025" name="__module.model.layers.32.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5026" name="__module.model.layers.32.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5413,q.65"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5027" name="__module.model.layers.32.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5422"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5028" name="Constant_1121201" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5029" name="Constant_1121203" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5030" name="Constant_1121205" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5031" name="__module.model.layers.32.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5432,x2.129"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5032" name="Constant_1176156" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5033" name="__module.model.layers.32.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5433"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5034" name="Constant_1121098" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5035" name="Constant_1121142" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5036" name="Constant_1121144" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5037" name="__module.model.layers.32.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5427"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5038" name="__module.model.layers.32.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5435"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5039" name="__module.model.layers.32.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5436"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5040" name="__module.model.layers.32.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5437"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5041" name="ReadValue_1190164" type="ReadValue" version="opset6"> <data variable_id="past_key_values.32.keypresent.32.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.32.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5042" name="Constant_1189567" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5043" name="Gather_1189568" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5044" name="self.model.layers.32.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="8018888464" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5045" name="Convert_1230992" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5046" name="self.model.layers.32.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="8022034192" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5047" name="Convert_1230995" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5048" name="self.model.layers.32.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5049" name="self.model.layers.32.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="8022035216" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5050" name="self.model.layers.32.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5051" name="__module.model.layers.32.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5052" name="__module.model.layers.32.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5408,key_states.133"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5053" name="Constant_1187878" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5054" name="__module.model.layers.32.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5415"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5055" name="__module.model.layers.32.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5056" name="__module.model.layers.32.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5416,k.65"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5057" name="__module.model.layers.32.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5438"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5058" name="Constant_1121344" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5059" name="Constant_1121346" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5060" name="Constant_1121348" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5061" name="__module.model.layers.32.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5448,x2.131"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5062" name="Constant_1176157" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5063" name="__module.model.layers.32.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5449"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5064" name="Constant_1121241" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5065" name="Constant_1121285" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5066" name="Constant_1121287" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5067" name="__module.model.layers.32.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5443"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5068" name="__module.model.layers.32.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5451"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5069" name="__module.model.layers.32.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5452"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5070" name="__module.model.layers.32.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5453"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5071" name="__module.model.layers.32.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5463,5464,hidden_states.969,present.32.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5072" name="__module.model.layers.32.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5465,5466,5467"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5073" name="__module.model.layers.32.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5469,hidden_states.971"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5074" name="Constant_1187879" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5075" name="__module.model.layers.32.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5473,key_states.135"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5076" name="ReadValue_1190166" type="ReadValue" version="opset6"> <data variable_id="past_key_values.32.valuepresent.32.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.32.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5077" name="Constant_1189570" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5078" name="Gather_1189571" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5079" name="self.model.layers.32.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="8022037264" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5080" name="Convert_1230982" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5081" name="self.model.layers.32.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="8025182992" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5082" name="Convert_1230985" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5083" name="self.model.layers.32.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5084" name="self.model.layers.32.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="8025184016" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5085" name="self.model.layers.32.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5086" name="__module.model.layers.32.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5087" name="__module.model.layers.32.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5410,value_states.65"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5088" name="Constant_1187880" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5089" name="__module.model.layers.32.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5418"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5090" name="__module.model.layers.32.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5091" name="__module.model.layers.32.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5419"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5092" name="__module.model.layers.32.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5479,5480,hidden_states.973,present.32.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5093" name="__module.model.layers.32.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5481,5482,5483"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5094" name="__module.model.layers.32.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5485,hidden_states.975"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5095" name="Constant_1187881" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5096" name="__module.model.layers.32.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5489"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5097" name="__module.model.layers.32.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="5495,attn_output.129"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5098" name="__module.model.layers.32.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5099" name="__module.model.layers.32.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5496"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5100" name="__module.model.layers.32.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="5499"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="5101" name="self.model.layers.32.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="8025186064" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5102" name="Convert_1230192" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5103" name="self.model.layers.32.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8034623248" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5104" name="Convert_1230195" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5105" name="self.model.layers.32.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5106" name="self.model.layers.32.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8034626320" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5107" name="self.model.layers.32.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5108" name="__module.model.layers.32.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5109" name="__module.model.layers.32.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5501,5503,hidden_states.977"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5110" name="__module.model.layers.32/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5506,5508,5519,hidden_states.979,hidden_states.981"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5111" name="Constant_1176161" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="8034632464" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5112" name="Constant_1176160" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5113" name="Constant_1176158" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5114" name="__module.model.layers.32.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5509"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5115" name="Constant_1121947" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5510"> <dim>1</dim> </port> </output> </layer> <layer id="5116" name="__module.model.layers.32.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5511,variance.131"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5117" name="Constant_1176159" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5118" name="__module.model.layers.32.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5512"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5119" name="__module.model.layers.32.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5120" name="__module.model.layers.32.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5513"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5121" name="__module.model.layers.32.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5514,5515,hidden_states.983,hidden_states.985"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5122" name="__module.model.layers.32.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5516,5518"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5123" name="self.model.layers.32.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="8034644752" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5124" name="Convert_1229312" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5125" name="self.model.layers.32.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="8105423632" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5126" name="Convert_1229315" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5127" name="self.model.layers.32.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5128" name="self.model.layers.32.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="8105446672" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5129" name="self.model.layers.32.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5130" name="__module.model.layers.32.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5131" name="__module.model.layers.32.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5524,input.65"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5132" name="__module.model.layers.32.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="5525"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5133" name="self.model.layers.32.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="8105492752" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5134" name="Convert_1229302" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5135" name="self.model.layers.32.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="8176271632" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5136" name="Convert_1229305" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5137" name="self.model.layers.32.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5138" name="self.model.layers.32.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="8176294672" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5139" name="self.model.layers.32.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5140" name="__module.model.layers.32.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5141" name="__module.model.layers.32.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5527"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5142" name="__module.model.layers.32.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5528"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5143" name="self.model.layers.32.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="8176340752" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5144" name="Convert_1229322" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5145" name="self.model.layers.32.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8247119632" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5146" name="Convert_1229325" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5147" name="self.model.layers.32.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5148" name="self.model.layers.32.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8247122704" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5149" name="self.model.layers.32.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5150" name="__module.model.layers.32.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5151" name="__module.model.layers.32.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5530,hidden_states.987"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5152" name="__module.model.layers.32/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5531,5533,5541,5552,hidden_states.989,hidden_states.991"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5153" name="Constant_1176165" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="8247128848" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5154" name="Constant_1176164" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5155" name="Constant_1176162" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5156" name="__module.model.layers.33.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5542"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5157" name="Constant_1122021" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5543"> <dim>1</dim> </port> </output> </layer> <layer id="5158" name="__module.model.layers.33.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5544,variance.133"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5159" name="Constant_1176163" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5160" name="__module.model.layers.33.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5545"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5161" name="__module.model.layers.33.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5162" name="__module.model.layers.33.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5546"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5163" name="__module.model.layers.33.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5547,5548,hidden_states.993,hidden_states.995"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5164" name="__module.model.layers.33.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5549,5551,hidden_states.997"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5165" name="self.model.layers.33.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="8247141136" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5166" name="Convert_1230202" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5167" name="self.model.layers.33.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8256578320" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5168" name="Convert_1230205" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5169" name="self.model.layers.33.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5170" name="self.model.layers.33.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8256581392" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5171" name="self.model.layers.33.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5172" name="__module.model.layers.33.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5173" name="__module.model.layers.33.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5560,query_states.67"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5174" name="Constant_1187882" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5175" name="__module.model.layers.33.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5566"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5176" name="__module.model.layers.33.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5177" name="__module.model.layers.33.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5567,q.67"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5178" name="__module.model.layers.33.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5576"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5179" name="Constant_1122418" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5180" name="Constant_1122420" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5181" name="Constant_1122422" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5182" name="__module.model.layers.33.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5586,x2.133"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5183" name="Constant_1176166" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5184" name="__module.model.layers.33.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5587"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5185" name="Constant_1122315" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5186" name="Constant_1122359" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5187" name="Constant_1122361" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5188" name="__module.model.layers.33.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5581"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5189" name="__module.model.layers.33.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5589"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5190" name="__module.model.layers.33.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5590"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5191" name="__module.model.layers.33.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5591"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5192" name="ReadValue_1190168" type="ReadValue" version="opset6"> <data variable_id="past_key_values.33.keypresent.33.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.33.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5193" name="Constant_1189573" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5194" name="Gather_1189574" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5195" name="self.model.layers.33.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="8256587536" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5196" name="Convert_1231012" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5197" name="self.model.layers.33.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="8259733264" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5198" name="Convert_1231015" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5199" name="self.model.layers.33.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5200" name="self.model.layers.33.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="8259734288" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5201" name="self.model.layers.33.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5202" name="__module.model.layers.33.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5203" name="__module.model.layers.33.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5562,key_states.137"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5204" name="Constant_1187883" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5205" name="__module.model.layers.33.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5569"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5206" name="__module.model.layers.33.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5207" name="__module.model.layers.33.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5570,k.67"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5208" name="__module.model.layers.33.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5592"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5209" name="Constant_1122561" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5210" name="Constant_1122563" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5211" name="Constant_1122565" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5212" name="__module.model.layers.33.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5602,x2.135"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5213" name="Constant_1176167" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5214" name="__module.model.layers.33.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5603"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5215" name="Constant_1122458" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5216" name="Constant_1122502" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5217" name="Constant_1122504" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5218" name="__module.model.layers.33.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5597"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5219" name="__module.model.layers.33.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5605"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5220" name="__module.model.layers.33.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5606"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5221" name="__module.model.layers.33.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5607"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5222" name="__module.model.layers.33.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5617,5618,hidden_states.999,present.33.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5223" name="__module.model.layers.33.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5619,5620,5621"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5224" name="__module.model.layers.33.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5623,hidden_states.1001"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5225" name="Constant_1187884" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5226" name="__module.model.layers.33.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5627,key_states.139"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5227" name="ReadValue_1190170" type="ReadValue" version="opset6"> <data variable_id="past_key_values.33.valuepresent.33.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.33.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5228" name="Constant_1189576" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5229" name="Gather_1189577" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5230" name="self.model.layers.33.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="8259736336" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5231" name="Convert_1231002" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5232" name="self.model.layers.33.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="8262882064" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5233" name="Convert_1231005" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5234" name="self.model.layers.33.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5235" name="self.model.layers.33.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="8262883088" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5236" name="self.model.layers.33.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5237" name="__module.model.layers.33.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5238" name="__module.model.layers.33.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5564,value_states.67"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5239" name="Constant_1187885" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5240" name="__module.model.layers.33.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5572"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5241" name="__module.model.layers.33.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5242" name="__module.model.layers.33.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5573"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5243" name="__module.model.layers.33.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5633,5634,hidden_states.1003,present.33.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5244" name="__module.model.layers.33.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5635,5636,5637"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5245" name="__module.model.layers.33.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5639,hidden_states.1005"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5246" name="Constant_1187886" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5247" name="__module.model.layers.33.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5643"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5248" name="__module.model.layers.33.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="5649,attn_output.133"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5249" name="__module.model.layers.33.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5250" name="__module.model.layers.33.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5650"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5251" name="__module.model.layers.33.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="5653"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="5252" name="self.model.layers.33.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="8262885136" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5253" name="Convert_1230212" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5254" name="self.model.layers.33.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8272322320" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5255" name="Convert_1230215" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5256" name="self.model.layers.33.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5257" name="self.model.layers.33.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8272325392" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5258" name="self.model.layers.33.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5259" name="__module.model.layers.33.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5260" name="__module.model.layers.33.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5655,5657,hidden_states.1007"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5261" name="__module.model.layers.33/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5660,5662,5673,hidden_states.1009,hidden_states.1011"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5262" name="Constant_1176171" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="8272331536" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5263" name="Constant_1176170" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5264" name="Constant_1176168" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5265" name="__module.model.layers.33.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5663"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5266" name="Constant_1123164" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5664"> <dim>1</dim> </port> </output> </layer> <layer id="5267" name="__module.model.layers.33.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5665,variance.135"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5268" name="Constant_1176169" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5269" name="__module.model.layers.33.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5666"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5270" name="__module.model.layers.33.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5271" name="__module.model.layers.33.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5667"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5272" name="__module.model.layers.33.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5668,5669,hidden_states.1013,hidden_states.1015"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5273" name="__module.model.layers.33.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5670,5672"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5274" name="self.model.layers.33.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="8272343824" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5275" name="Convert_1229342" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5276" name="self.model.layers.33.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="8343122704" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5277" name="Convert_1229345" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5278" name="self.model.layers.33.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5279" name="self.model.layers.33.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="8343145744" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5280" name="self.model.layers.33.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5281" name="__module.model.layers.33.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5282" name="__module.model.layers.33.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5678,input.67"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5283" name="__module.model.layers.33.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="5679"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5284" name="self.model.layers.33.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="8343191824" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5285" name="Convert_1229332" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5286" name="self.model.layers.33.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="8413970704" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5287" name="Convert_1229335" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5288" name="self.model.layers.33.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5289" name="self.model.layers.33.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="8413993744" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5290" name="self.model.layers.33.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5291" name="__module.model.layers.33.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5292" name="__module.model.layers.33.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5681"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5293" name="__module.model.layers.33.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5682"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5294" name="self.model.layers.33.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="8414039824" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5295" name="Convert_1229352" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5296" name="self.model.layers.33.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8484818704" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5297" name="Convert_1229355" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5298" name="self.model.layers.33.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5299" name="self.model.layers.33.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8484821776" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5300" name="self.model.layers.33.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5301" name="__module.model.layers.33.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5302" name="__module.model.layers.33.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5684,hidden_states.1017"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5303" name="__module.model.layers.33/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5685,5687,5695,5706,hidden_states.1019,hidden_states.1021"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5304" name="Constant_1176175" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="8484827920" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5305" name="Constant_1176174" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5306" name="Constant_1176172" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5307" name="__module.model.layers.34.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5696"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5308" name="Constant_1123238" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5697"> <dim>1</dim> </port> </output> </layer> <layer id="5309" name="__module.model.layers.34.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5698,variance.137"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5310" name="Constant_1176173" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5311" name="__module.model.layers.34.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5699"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5312" name="__module.model.layers.34.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5313" name="__module.model.layers.34.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5700"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5314" name="__module.model.layers.34.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5701,5702,hidden_states.1023,hidden_states.1025"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5315" name="__module.model.layers.34.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5703,5705,hidden_states.1027"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5316" name="self.model.layers.34.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="8484840208" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5317" name="Convert_1230222" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5318" name="self.model.layers.34.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8494277392" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5319" name="Convert_1230225" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5320" name="self.model.layers.34.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5321" name="self.model.layers.34.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8494280464" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5322" name="self.model.layers.34.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5323" name="__module.model.layers.34.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5324" name="__module.model.layers.34.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5714,query_states.69"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5325" name="Constant_1187887" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5326" name="__module.model.layers.34.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5720"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5327" name="__module.model.layers.34.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5328" name="__module.model.layers.34.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5721,q.69"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5329" name="__module.model.layers.34.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5730"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5330" name="Constant_1123635" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5331" name="Constant_1123637" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5332" name="Constant_1123639" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5333" name="__module.model.layers.34.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5740,x2.137"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5334" name="Constant_1176176" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5335" name="__module.model.layers.34.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5741"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5336" name="Constant_1123532" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5337" name="Constant_1123576" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5338" name="Constant_1123578" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5339" name="__module.model.layers.34.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5735"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5340" name="__module.model.layers.34.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5743"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5341" name="__module.model.layers.34.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5744"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5342" name="__module.model.layers.34.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5745"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5343" name="ReadValue_1190172" type="ReadValue" version="opset6"> <data variable_id="past_key_values.34.keypresent.34.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.34.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5344" name="Constant_1189579" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5345" name="Gather_1189580" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5346" name="self.model.layers.34.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="8494286608" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5347" name="Convert_1231032" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5348" name="self.model.layers.34.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="8497432336" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5349" name="Convert_1231035" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5350" name="self.model.layers.34.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5351" name="self.model.layers.34.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="8497433360" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5352" name="self.model.layers.34.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5353" name="__module.model.layers.34.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5354" name="__module.model.layers.34.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5716,key_states.141"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5355" name="Constant_1187888" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5356" name="__module.model.layers.34.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5723"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5357" name="__module.model.layers.34.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5358" name="__module.model.layers.34.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5724,k.69"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5359" name="__module.model.layers.34.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5746"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5360" name="Constant_1123778" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5361" name="Constant_1123780" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5362" name="Constant_1123782" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5363" name="__module.model.layers.34.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5756,x2.139"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5364" name="Constant_1176177" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5365" name="__module.model.layers.34.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5757"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5366" name="Constant_1123675" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5367" name="Constant_1123719" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5368" name="Constant_1123721" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5369" name="__module.model.layers.34.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5751"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5370" name="__module.model.layers.34.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5759"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5371" name="__module.model.layers.34.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5760"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5372" name="__module.model.layers.34.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5761"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5373" name="__module.model.layers.34.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5771,5772,hidden_states.1029,present.34.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5374" name="__module.model.layers.34.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5773,5774,5775"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5375" name="__module.model.layers.34.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5777,hidden_states.1031"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5376" name="Constant_1187889" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5377" name="__module.model.layers.34.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5781,key_states.143"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5378" name="ReadValue_1190174" type="ReadValue" version="opset6"> <data variable_id="past_key_values.34.valuepresent.34.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.34.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5379" name="Constant_1189582" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5380" name="Gather_1189583" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5381" name="self.model.layers.34.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="8497435408" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5382" name="Convert_1231022" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5383" name="self.model.layers.34.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="8500581136" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5384" name="Convert_1231025" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5385" name="self.model.layers.34.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5386" name="self.model.layers.34.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="8500582160" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5387" name="self.model.layers.34.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5388" name="__module.model.layers.34.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5389" name="__module.model.layers.34.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5718,value_states.69"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5390" name="Constant_1187890" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5391" name="__module.model.layers.34.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5726"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5392" name="__module.model.layers.34.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5393" name="__module.model.layers.34.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5727"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5394" name="__module.model.layers.34.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5787,5788,hidden_states.1033,present.34.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5395" name="__module.model.layers.34.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5789,5790,5791"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5396" name="__module.model.layers.34.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5793,hidden_states.1035"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5397" name="Constant_1187891" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5398" name="__module.model.layers.34.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5797"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5399" name="__module.model.layers.34.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="5803,attn_output.137"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5400" name="__module.model.layers.34.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5401" name="__module.model.layers.34.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5804"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5402" name="__module.model.layers.34.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="5807"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="5403" name="self.model.layers.34.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="8500584208" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5404" name="Convert_1230232" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5405" name="self.model.layers.34.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8510021392" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5406" name="Convert_1230235" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5407" name="self.model.layers.34.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5408" name="self.model.layers.34.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8510024464" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5409" name="self.model.layers.34.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5410" name="__module.model.layers.34.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5411" name="__module.model.layers.34.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5809,5811,hidden_states.1037"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5412" name="__module.model.layers.34/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5814,5816,5827,hidden_states.1039,hidden_states.1041"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5413" name="Constant_1176181" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="8510030608" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5414" name="Constant_1176180" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5415" name="Constant_1176178" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5416" name="__module.model.layers.34.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5817"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5417" name="Constant_1124381" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5818"> <dim>1</dim> </port> </output> </layer> <layer id="5418" name="__module.model.layers.34.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5819,variance.139"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5419" name="Constant_1176179" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5420" name="__module.model.layers.34.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5820"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5421" name="__module.model.layers.34.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5422" name="__module.model.layers.34.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5821"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5423" name="__module.model.layers.34.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5822,5823,hidden_states.1043,hidden_states.1045"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5424" name="__module.model.layers.34.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5824,5826"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5425" name="self.model.layers.34.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="8510042896" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5426" name="Convert_1229372" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5427" name="self.model.layers.34.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="8580821776" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5428" name="Convert_1229375" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5429" name="self.model.layers.34.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5430" name="self.model.layers.34.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="8580844816" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5431" name="self.model.layers.34.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5432" name="__module.model.layers.34.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5433" name="__module.model.layers.34.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5832,input.69"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5434" name="__module.model.layers.34.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="5833"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5435" name="self.model.layers.34.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="8580890896" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5436" name="Convert_1229362" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5437" name="self.model.layers.34.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="8651669776" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5438" name="Convert_1229365" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5439" name="self.model.layers.34.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5440" name="self.model.layers.34.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="8651692816" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5441" name="self.model.layers.34.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5442" name="__module.model.layers.34.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5443" name="__module.model.layers.34.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5835"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5444" name="__module.model.layers.34.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5836"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5445" name="self.model.layers.34.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="8651738896" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5446" name="Convert_1229382" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5447" name="self.model.layers.34.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8722517776" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5448" name="Convert_1229385" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5449" name="self.model.layers.34.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5450" name="self.model.layers.34.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8722520848" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5451" name="self.model.layers.34.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5452" name="__module.model.layers.34.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5453" name="__module.model.layers.34.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5838,hidden_states.1047"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5454" name="__module.model.layers.34/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5839,5841,5849,5860,hidden_states.1049,hidden_states.1051"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5455" name="Constant_1176185" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="8722526992" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5456" name="Constant_1176184" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5457" name="Constant_1176182" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5458" name="__module.model.layers.35.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5850"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5459" name="Constant_1124455" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5851"> <dim>1</dim> </port> </output> </layer> <layer id="5460" name="__module.model.layers.35.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5852,variance.141"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5461" name="Constant_1176183" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5462" name="__module.model.layers.35.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5853"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5463" name="__module.model.layers.35.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5464" name="__module.model.layers.35.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5854"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5465" name="__module.model.layers.35.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5855,5856,hidden_states.1053,hidden_states.1055"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5466" name="__module.model.layers.35.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5857,5859,hidden_states.1057"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5467" name="self.model.layers.35.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="8722539280" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5468" name="Convert_1230242" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5469" name="self.model.layers.35.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8731976464" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5470" name="Convert_1230245" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5471" name="self.model.layers.35.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5472" name="self.model.layers.35.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8731979536" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5473" name="self.model.layers.35.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5474" name="__module.model.layers.35.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5475" name="__module.model.layers.35.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5868,query_states.71"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5476" name="Constant_1187892" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5477" name="__module.model.layers.35.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5874"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5478" name="__module.model.layers.35.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5479" name="__module.model.layers.35.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5875,q.71"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5480" name="__module.model.layers.35.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5884"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5481" name="Constant_1124852" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5482" name="Constant_1124854" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5483" name="Constant_1124856" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5484" name="__module.model.layers.35.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5894,x2.141"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5485" name="Constant_1176186" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5486" name="__module.model.layers.35.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5895"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5487" name="Constant_1124749" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5488" name="Constant_1124793" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5489" name="Constant_1124795" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5490" name="__module.model.layers.35.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5889"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5491" name="__module.model.layers.35.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5897"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5492" name="__module.model.layers.35.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5898"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5493" name="__module.model.layers.35.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5899"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5494" name="ReadValue_1190176" type="ReadValue" version="opset6"> <data variable_id="past_key_values.35.keypresent.35.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.35.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5495" name="Constant_1189585" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5496" name="Gather_1189586" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5497" name="self.model.layers.35.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="8731985680" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5498" name="Convert_1231052" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5499" name="self.model.layers.35.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="8735131408" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5500" name="Convert_1231055" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5501" name="self.model.layers.35.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5502" name="self.model.layers.35.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="8735132432" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5503" name="self.model.layers.35.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5504" name="__module.model.layers.35.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5505" name="__module.model.layers.35.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5870,key_states.145"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5506" name="Constant_1187893" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5507" name="__module.model.layers.35.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5877"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5508" name="__module.model.layers.35.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5509" name="__module.model.layers.35.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5878,k.71"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5510" name="__module.model.layers.35.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5900"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5511" name="Constant_1124995" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5512" name="Constant_1124997" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5513" name="Constant_1124999" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5514" name="__module.model.layers.35.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5910,x2.143"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5515" name="Constant_1176187" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5516" name="__module.model.layers.35.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5911"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5517" name="Constant_1124892" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5518" name="Constant_1124936" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5519" name="Constant_1124938" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5520" name="__module.model.layers.35.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5905"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5521" name="__module.model.layers.35.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="5913"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5522" name="__module.model.layers.35.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5914"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5523" name="__module.model.layers.35.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5915"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5524" name="__module.model.layers.35.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5925,5926,hidden_states.1059,present.35.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5525" name="__module.model.layers.35.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5927,5928,5929"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5526" name="__module.model.layers.35.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5931,hidden_states.1061"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5527" name="Constant_1187894" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5528" name="__module.model.layers.35.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5935,key_states.147"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5529" name="ReadValue_1190178" type="ReadValue" version="opset6"> <data variable_id="past_key_values.35.valuepresent.35.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.35.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5530" name="Constant_1189588" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5531" name="Gather_1189589" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5532" name="self.model.layers.35.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="8735134480" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5533" name="Convert_1231042" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5534" name="self.model.layers.35.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="8738280208" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5535" name="Convert_1231045" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5536" name="self.model.layers.35.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5537" name="self.model.layers.35.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="8738281232" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5538" name="self.model.layers.35.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5539" name="__module.model.layers.35.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5540" name="__module.model.layers.35.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5872,value_states.71"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5541" name="Constant_1187895" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5542" name="__module.model.layers.35.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5880"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5543" name="__module.model.layers.35.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5544" name="__module.model.layers.35.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5881"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5545" name="__module.model.layers.35.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="5941,5942,hidden_states.1063,present.35.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5546" name="__module.model.layers.35.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="5943,5944,5945"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5547" name="__module.model.layers.35.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="5947,hidden_states.1065"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5548" name="Constant_1187896" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5549" name="__module.model.layers.35.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5951"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5550" name="__module.model.layers.35.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="5957,attn_output.141"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5551" name="__module.model.layers.35.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5552" name="__module.model.layers.35.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5958"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5553" name="__module.model.layers.35.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="5961"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="5554" name="self.model.layers.35.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="8738283280" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5555" name="Convert_1230252" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5556" name="self.model.layers.35.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8747720464" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5557" name="Convert_1230255" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5558" name="self.model.layers.35.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5559" name="self.model.layers.35.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8747723536" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5560" name="self.model.layers.35.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5561" name="__module.model.layers.35.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5562" name="__module.model.layers.35.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5963,5965,hidden_states.1067"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5563" name="__module.model.layers.35/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5968,5970,5981,hidden_states.1069,hidden_states.1071"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5564" name="Constant_1176191" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="8747729680" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5565" name="Constant_1176190" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5566" name="Constant_1176188" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5567" name="__module.model.layers.35.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5971"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5568" name="Constant_1125598" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="5972"> <dim>1</dim> </port> </output> </layer> <layer id="5569" name="__module.model.layers.35.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5973,variance.143"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5570" name="Constant_1176189" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5571" name="__module.model.layers.35.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5974"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5572" name="__module.model.layers.35.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5573" name="__module.model.layers.35.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5975"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5574" name="__module.model.layers.35.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5976,5977,hidden_states.1073,hidden_states.1075"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5575" name="__module.model.layers.35.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5978,5980"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5576" name="self.model.layers.35.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="8747741968" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5577" name="Convert_1229402" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5578" name="self.model.layers.35.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="8818520848" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5579" name="Convert_1229405" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5580" name="self.model.layers.35.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5581" name="self.model.layers.35.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="8818543888" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5582" name="self.model.layers.35.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5583" name="__module.model.layers.35.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5584" name="__module.model.layers.35.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5986,input.71"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5585" name="__module.model.layers.35.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="5987"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5586" name="self.model.layers.35.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="8818589968" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5587" name="Convert_1229392" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5588" name="self.model.layers.35.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="8889368848" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5589" name="Convert_1229395" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5590" name="self.model.layers.35.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5591" name="self.model.layers.35.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="8889391888" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5592" name="self.model.layers.35.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5593" name="__module.model.layers.35.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5594" name="__module.model.layers.35.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5989"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5595" name="__module.model.layers.35.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5990"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5596" name="self.model.layers.35.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="8889437968" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5597" name="Convert_1229412" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5598" name="self.model.layers.35.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8960216848" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5599" name="Convert_1229415" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5600" name="self.model.layers.35.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5601" name="self.model.layers.35.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8960219920" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5602" name="self.model.layers.35.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5603" name="__module.model.layers.35.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5604" name="__module.model.layers.35.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="5992,hidden_states.1077"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5605" name="__module.model.layers.35/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5993,5995,6003,6014,hidden_states.1079,hidden_states.1081"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5606" name="Constant_1176195" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="8960226064" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5607" name="Constant_1176194" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5608" name="Constant_1176192" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5609" name="__module.model.layers.36.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6004"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5610" name="Constant_1125672" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="6005"> <dim>1</dim> </port> </output> </layer> <layer id="5611" name="__module.model.layers.36.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6006,variance.145"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5612" name="Constant_1176193" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5613" name="__module.model.layers.36.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6007"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5614" name="__module.model.layers.36.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5615" name="__module.model.layers.36.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6008"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5616" name="__module.model.layers.36.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6009,6010,hidden_states.1083,hidden_states.1085"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5617" name="__module.model.layers.36.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6011,6013,hidden_states.1087"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5618" name="self.model.layers.36.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="8960238352" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5619" name="Convert_1230262" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5620" name="self.model.layers.36.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8969675536" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5621" name="Convert_1230265" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5622" name="self.model.layers.36.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5623" name="self.model.layers.36.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8969678608" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5624" name="self.model.layers.36.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5625" name="__module.model.layers.36.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5626" name="__module.model.layers.36.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6022,query_states.73"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5627" name="Constant_1187897" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5628" name="__module.model.layers.36.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6028"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5629" name="__module.model.layers.36.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5630" name="__module.model.layers.36.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6029,q.73"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5631" name="__module.model.layers.36.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6038"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5632" name="Constant_1126069" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5633" name="Constant_1126071" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5634" name="Constant_1126073" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5635" name="__module.model.layers.36.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6048,x2.145"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5636" name="Constant_1176196" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5637" name="__module.model.layers.36.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6049"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5638" name="Constant_1125966" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5639" name="Constant_1126010" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5640" name="Constant_1126012" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5641" name="__module.model.layers.36.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6043"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5642" name="__module.model.layers.36.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="6051"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5643" name="__module.model.layers.36.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6052"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5644" name="__module.model.layers.36.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6053"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5645" name="ReadValue_1190180" type="ReadValue" version="opset6"> <data variable_id="past_key_values.36.keypresent.36.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.36.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5646" name="Constant_1189591" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5647" name="Gather_1189592" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5648" name="self.model.layers.36.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="8969684752" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5649" name="Convert_1231072" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5650" name="self.model.layers.36.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="8972830480" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5651" name="Convert_1231075" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5652" name="self.model.layers.36.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5653" name="self.model.layers.36.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="8972831504" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5654" name="self.model.layers.36.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5655" name="__module.model.layers.36.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5656" name="__module.model.layers.36.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6024,key_states.149"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5657" name="Constant_1187898" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5658" name="__module.model.layers.36.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6031"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5659" name="__module.model.layers.36.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5660" name="__module.model.layers.36.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6032,k.73"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5661" name="__module.model.layers.36.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6054"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5662" name="Constant_1126212" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5663" name="Constant_1126214" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5664" name="Constant_1126216" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5665" name="__module.model.layers.36.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6064,x2.147"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5666" name="Constant_1176197" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5667" name="__module.model.layers.36.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6065"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5668" name="Constant_1126109" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5669" name="Constant_1126153" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5670" name="Constant_1126155" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5671" name="__module.model.layers.36.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6059"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5672" name="__module.model.layers.36.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="6067"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5673" name="__module.model.layers.36.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6068"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5674" name="__module.model.layers.36.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6069"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5675" name="__module.model.layers.36.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6079,6080,hidden_states.1089,present.36.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5676" name="__module.model.layers.36.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="6081,6082,6083"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5677" name="__module.model.layers.36.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="6085,hidden_states.1091"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5678" name="Constant_1187899" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5679" name="__module.model.layers.36.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6089,key_states.151"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5680" name="ReadValue_1190182" type="ReadValue" version="opset6"> <data variable_id="past_key_values.36.valuepresent.36.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.36.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5681" name="Constant_1189594" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5682" name="Gather_1189595" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5683" name="self.model.layers.36.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="8972833552" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5684" name="Convert_1231062" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5685" name="self.model.layers.36.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="8975979280" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5686" name="Convert_1231065" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5687" name="self.model.layers.36.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5688" name="self.model.layers.36.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="8975980304" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5689" name="self.model.layers.36.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5690" name="__module.model.layers.36.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5691" name="__module.model.layers.36.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6026,value_states.73"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5692" name="Constant_1187900" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5693" name="__module.model.layers.36.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6034"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5694" name="__module.model.layers.36.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5695" name="__module.model.layers.36.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6035"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5696" name="__module.model.layers.36.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6095,6096,hidden_states.1093,present.36.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5697" name="__module.model.layers.36.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="6097,6098,6099"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5698" name="__module.model.layers.36.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="6101,hidden_states.1095"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5699" name="Constant_1187901" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5700" name="__module.model.layers.36.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6105"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5701" name="__module.model.layers.36.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="6111,attn_output.145"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5702" name="__module.model.layers.36.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5703" name="__module.model.layers.36.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6112"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5704" name="__module.model.layers.36.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="6115"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="5705" name="self.model.layers.36.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="8975982352" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5706" name="Convert_1230272" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5707" name="self.model.layers.36.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="8985419536" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5708" name="Convert_1230275" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5709" name="self.model.layers.36.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5710" name="self.model.layers.36.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="8985422608" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5711" name="self.model.layers.36.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5712" name="__module.model.layers.36.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5713" name="__module.model.layers.36.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6117,6119,hidden_states.1097"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5714" name="__module.model.layers.36/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6122,6124,6135,hidden_states.1099,hidden_states.1101"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5715" name="Constant_1176201" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="8985428752" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5716" name="Constant_1176200" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5717" name="Constant_1176198" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5718" name="__module.model.layers.36.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6125"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5719" name="Constant_1126815" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="6126"> <dim>1</dim> </port> </output> </layer> <layer id="5720" name="__module.model.layers.36.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6127,variance.147"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5721" name="Constant_1176199" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5722" name="__module.model.layers.36.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6128"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5723" name="__module.model.layers.36.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5724" name="__module.model.layers.36.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6129"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5725" name="__module.model.layers.36.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6130,6131,hidden_states.1103,hidden_states.1105"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5726" name="__module.model.layers.36.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6132,6134"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5727" name="self.model.layers.36.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="8985441040" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5728" name="Convert_1229432" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5729" name="self.model.layers.36.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="9056219920" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5730" name="Convert_1229435" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5731" name="self.model.layers.36.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5732" name="self.model.layers.36.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="9056242960" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5733" name="self.model.layers.36.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5734" name="__module.model.layers.36.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5735" name="__module.model.layers.36.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6140,input.73"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5736" name="__module.model.layers.36.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="6141"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5737" name="self.model.layers.36.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="9056289040" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5738" name="Convert_1229422" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5739" name="self.model.layers.36.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="9127067920" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5740" name="Convert_1229425" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5741" name="self.model.layers.36.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5742" name="self.model.layers.36.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="9127090960" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5743" name="self.model.layers.36.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5744" name="__module.model.layers.36.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5745" name="__module.model.layers.36.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6143"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5746" name="__module.model.layers.36.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="6144"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5747" name="self.model.layers.36.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="9127137040" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5748" name="Convert_1229442" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5749" name="self.model.layers.36.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="9197915920" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5750" name="Convert_1229445" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5751" name="self.model.layers.36.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5752" name="self.model.layers.36.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="9197918992" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5753" name="self.model.layers.36.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5754" name="__module.model.layers.36.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5755" name="__module.model.layers.36.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="6146,hidden_states.1107"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5756" name="__module.model.layers.36/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6147,6149,6157,6168,hidden_states.1109,hidden_states.1111"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5757" name="Constant_1176205" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="9197925136" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5758" name="Constant_1176204" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5759" name="Constant_1176202" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5760" name="__module.model.layers.37.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6158"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5761" name="Constant_1126889" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="6159"> <dim>1</dim> </port> </output> </layer> <layer id="5762" name="__module.model.layers.37.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6160,variance.149"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5763" name="Constant_1176203" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5764" name="__module.model.layers.37.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6161"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5765" name="__module.model.layers.37.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5766" name="__module.model.layers.37.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6162"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5767" name="__module.model.layers.37.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6163,6164,hidden_states.1113,hidden_states.1115"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5768" name="__module.model.layers.37.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6165,6167,hidden_states.1117"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5769" name="self.model.layers.37.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="9197937424" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5770" name="Convert_1230282" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5771" name="self.model.layers.37.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="9207374608" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5772" name="Convert_1230285" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5773" name="self.model.layers.37.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5774" name="self.model.layers.37.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="9207377680" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5775" name="self.model.layers.37.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5776" name="__module.model.layers.37.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5777" name="__module.model.layers.37.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6176,query_states.75"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5778" name="Constant_1187902" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5779" name="__module.model.layers.37.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6182"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5780" name="__module.model.layers.37.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5781" name="__module.model.layers.37.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6183,q.75"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5782" name="__module.model.layers.37.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6192"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5783" name="Constant_1127286" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5784" name="Constant_1127288" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5785" name="Constant_1127290" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5786" name="__module.model.layers.37.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6202,x2.149"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5787" name="Constant_1176206" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5788" name="__module.model.layers.37.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6203"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5789" name="Constant_1127183" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5790" name="Constant_1127227" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5791" name="Constant_1127229" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5792" name="__module.model.layers.37.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6197"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5793" name="__module.model.layers.37.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="6205"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5794" name="__module.model.layers.37.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6206"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5795" name="__module.model.layers.37.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6207"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5796" name="ReadValue_1190184" type="ReadValue" version="opset6"> <data variable_id="past_key_values.37.keypresent.37.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.37.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5797" name="Constant_1189597" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5798" name="Gather_1189598" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5799" name="self.model.layers.37.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="9207383824" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5800" name="Convert_1231092" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5801" name="self.model.layers.37.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="9210529552" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5802" name="Convert_1231095" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5803" name="self.model.layers.37.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5804" name="self.model.layers.37.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="9210530576" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5805" name="self.model.layers.37.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5806" name="__module.model.layers.37.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5807" name="__module.model.layers.37.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6178,key_states.153"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5808" name="Constant_1187903" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5809" name="__module.model.layers.37.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6185"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5810" name="__module.model.layers.37.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5811" name="__module.model.layers.37.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6186,k.75"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5812" name="__module.model.layers.37.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6208"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5813" name="Constant_1127429" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5814" name="Constant_1127431" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5815" name="Constant_1127433" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5816" name="__module.model.layers.37.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6218,x2.151"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5817" name="Constant_1176207" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5818" name="__module.model.layers.37.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6219"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5819" name="Constant_1127326" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5820" name="Constant_1127370" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5821" name="Constant_1127372" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5822" name="__module.model.layers.37.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6213"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5823" name="__module.model.layers.37.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="6221"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5824" name="__module.model.layers.37.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6222"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5825" name="__module.model.layers.37.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6223"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5826" name="__module.model.layers.37.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6233,6234,hidden_states.1119,present.37.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5827" name="__module.model.layers.37.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="6235,6236,6237"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5828" name="__module.model.layers.37.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="6239,hidden_states.1121"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5829" name="Constant_1187904" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5830" name="__module.model.layers.37.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6243,key_states.155"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5831" name="ReadValue_1190186" type="ReadValue" version="opset6"> <data variable_id="past_key_values.37.valuepresent.37.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.37.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5832" name="Constant_1189600" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5833" name="Gather_1189601" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5834" name="self.model.layers.37.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="9210532624" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5835" name="Convert_1231082" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5836" name="self.model.layers.37.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="9213678352" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5837" name="Convert_1231085" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5838" name="self.model.layers.37.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5839" name="self.model.layers.37.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="9213679376" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5840" name="self.model.layers.37.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5841" name="__module.model.layers.37.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5842" name="__module.model.layers.37.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6180,value_states.75"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5843" name="Constant_1187905" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5844" name="__module.model.layers.37.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6188"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5845" name="__module.model.layers.37.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5846" name="__module.model.layers.37.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6189"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5847" name="__module.model.layers.37.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6249,6250,hidden_states.1123,present.37.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5848" name="__module.model.layers.37.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="6251,6252,6253"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5849" name="__module.model.layers.37.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="6255,hidden_states.1125"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5850" name="Constant_1187906" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5851" name="__module.model.layers.37.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6259"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5852" name="__module.model.layers.37.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="6265,attn_output.149"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5853" name="__module.model.layers.37.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5854" name="__module.model.layers.37.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6266"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5855" name="__module.model.layers.37.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="6269"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="5856" name="self.model.layers.37.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="9213681424" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5857" name="Convert_1230292" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5858" name="self.model.layers.37.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="9223118608" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5859" name="Convert_1230295" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5860" name="self.model.layers.37.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5861" name="self.model.layers.37.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="9223121680" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5862" name="self.model.layers.37.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5863" name="__module.model.layers.37.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5864" name="__module.model.layers.37.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6271,6273,hidden_states.1127"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5865" name="__module.model.layers.37/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6276,6278,6289,hidden_states.1129,hidden_states.1131"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5866" name="Constant_1176211" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="9223127824" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5867" name="Constant_1176210" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5868" name="Constant_1176208" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5869" name="__module.model.layers.37.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6279"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5870" name="Constant_1128032" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="6280"> <dim>1</dim> </port> </output> </layer> <layer id="5871" name="__module.model.layers.37.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6281,variance.151"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5872" name="Constant_1176209" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5873" name="__module.model.layers.37.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6282"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5874" name="__module.model.layers.37.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5875" name="__module.model.layers.37.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6283"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5876" name="__module.model.layers.37.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6284,6285,hidden_states.1133,hidden_states.1135"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5877" name="__module.model.layers.37.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6286,6288"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5878" name="self.model.layers.37.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="9223140112" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5879" name="Convert_1229462" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5880" name="self.model.layers.37.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="9293918992" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5881" name="Convert_1229465" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5882" name="self.model.layers.37.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5883" name="self.model.layers.37.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="9293942032" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5884" name="self.model.layers.37.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5885" name="__module.model.layers.37.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5886" name="__module.model.layers.37.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6294,input.75"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5887" name="__module.model.layers.37.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="6295"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5888" name="self.model.layers.37.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="9293988112" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5889" name="Convert_1229452" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5890" name="self.model.layers.37.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="9364766992" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5891" name="Convert_1229455" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5892" name="self.model.layers.37.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5893" name="self.model.layers.37.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="9364790032" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="5894" name="self.model.layers.37.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5895" name="__module.model.layers.37.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5896" name="__module.model.layers.37.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6297"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5897" name="__module.model.layers.37.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="6298"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5898" name="self.model.layers.37.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="9364836112" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5899" name="Convert_1229472" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5900" name="self.model.layers.37.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="9435614992" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5901" name="Convert_1229475" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5902" name="self.model.layers.37.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5903" name="self.model.layers.37.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="9435618064" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5904" name="self.model.layers.37.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5905" name="__module.model.layers.37.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="5906" name="__module.model.layers.37.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="6300,hidden_states.1137"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5907" name="__module.model.layers.37/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6301,6303,6311,6322,hidden_states.1139,hidden_states.1141"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5908" name="Constant_1176215" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="9435624208" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5909" name="Constant_1176214" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5910" name="Constant_1176212" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5911" name="__module.model.layers.38.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6312"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5912" name="Constant_1128106" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="6313"> <dim>1</dim> </port> </output> </layer> <layer id="5913" name="__module.model.layers.38.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6314,variance.153"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5914" name="Constant_1176213" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5915" name="__module.model.layers.38.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6315"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5916" name="__module.model.layers.38.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5917" name="__module.model.layers.38.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6316"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5918" name="__module.model.layers.38.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6317,6318,hidden_states.1143,hidden_states.1145"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5919" name="__module.model.layers.38.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6319,6321,hidden_states.1147"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5920" name="self.model.layers.38.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="9435636496" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5921" name="Convert_1230302" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5922" name="self.model.layers.38.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="9445073680" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5923" name="Convert_1230305" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5924" name="self.model.layers.38.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5925" name="self.model.layers.38.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="9445076752" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="5926" name="self.model.layers.38.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5927" name="__module.model.layers.38.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5928" name="__module.model.layers.38.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6330,query_states.77"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5929" name="Constant_1187907" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5930" name="__module.model.layers.38.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6336"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="5931" name="__module.model.layers.38.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5932" name="__module.model.layers.38.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6337,q.77"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5933" name="__module.model.layers.38.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6346"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5934" name="Constant_1128503" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5935" name="Constant_1128505" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5936" name="Constant_1128507" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5937" name="__module.model.layers.38.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6356,x2.153"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5938" name="Constant_1176216" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5939" name="__module.model.layers.38.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6357"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5940" name="Constant_1128400" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5941" name="Constant_1128444" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5942" name="Constant_1128446" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5943" name="__module.model.layers.38.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6351"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5944" name="__module.model.layers.38.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="6359"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5945" name="__module.model.layers.38.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6360"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5946" name="__module.model.layers.38.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6361"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5947" name="ReadValue_1190188" type="ReadValue" version="opset6"> <data variable_id="past_key_values.38.keypresent.38.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.38.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5948" name="Constant_1189603" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5949" name="Gather_1189604" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5950" name="self.model.layers.38.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="9445082896" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5951" name="Convert_1231112" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5952" name="self.model.layers.38.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="9448228624" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5953" name="Convert_1231115" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5954" name="self.model.layers.38.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5955" name="self.model.layers.38.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="9448229648" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5956" name="self.model.layers.38.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5957" name="__module.model.layers.38.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5958" name="__module.model.layers.38.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6332,key_states.157"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5959" name="Constant_1187908" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5960" name="__module.model.layers.38.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6339"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5961" name="__module.model.layers.38.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5962" name="__module.model.layers.38.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6340,k.77"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5963" name="__module.model.layers.38.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6362"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5964" name="Constant_1128646" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5965" name="Constant_1128648" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5966" name="Constant_1128650" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5967" name="__module.model.layers.38.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6372,x2.155"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5968" name="Constant_1176217" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="5969" name="__module.model.layers.38.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6373"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5970" name="Constant_1128543" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5971" name="Constant_1128587" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5972" name="Constant_1128589" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="5973" name="__module.model.layers.38.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6367"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="5974" name="__module.model.layers.38.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="6375"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5975" name="__module.model.layers.38.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6376"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5976" name="__module.model.layers.38.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6377"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5977" name="__module.model.layers.38.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6387,6388,hidden_states.1149,present.38.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5978" name="__module.model.layers.38.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="6389,6390,6391"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5979" name="__module.model.layers.38.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="6393,hidden_states.1151"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5980" name="Constant_1187909" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5981" name="__module.model.layers.38.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6397,key_states.159"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5982" name="ReadValue_1190190" type="ReadValue" version="opset6"> <data variable_id="past_key_values.38.valuepresent.38.value" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.38.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5983" name="Constant_1189606" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="5984" name="Gather_1189607" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5985" name="self.model.layers.38.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="9448231696" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5986" name="Convert_1231102" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5987" name="self.model.layers.38.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="9451377424" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5988" name="Convert_1231105" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5989" name="self.model.layers.38.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5990" name="self.model.layers.38.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="9451378448" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="5991" name="self.model.layers.38.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5992" name="__module.model.layers.38.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="5993" name="__module.model.layers.38.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6334,value_states.77"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5994" name="Constant_1187910" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5995" name="__module.model.layers.38.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6342"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="5996" name="__module.model.layers.38.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5997" name="__module.model.layers.38.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6343"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5998" name="__module.model.layers.38.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6403,6404,hidden_states.1153,present.38.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="5999" name="__module.model.layers.38.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="6405,6406,6407"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6000" name="__module.model.layers.38.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="6409,hidden_states.1155"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6001" name="Constant_1187911" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="6002" name="__module.model.layers.38.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6413"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6003" name="__module.model.layers.38.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="6419,attn_output.153"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6004" name="__module.model.layers.38.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="6005" name="__module.model.layers.38.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6420"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="6006" name="__module.model.layers.38.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="6423"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="6007" name="self.model.layers.38.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="9451380496" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6008" name="Convert_1230312" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6009" name="self.model.layers.38.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="9460817680" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6010" name="Convert_1230315" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6011" name="self.model.layers.38.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6012" name="self.model.layers.38.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="9460820752" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6013" name="self.model.layers.38.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6014" name="__module.model.layers.38.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6015" name="__module.model.layers.38.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6425,6427,hidden_states.1157"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6016" name="__module.model.layers.38/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6430,6432,6443,hidden_states.1159,hidden_states.1161"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6017" name="Constant_1176221" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="9460826896" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6018" name="Constant_1176220" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6019" name="Constant_1176218" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6020" name="__module.model.layers.38.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6433"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6021" name="Constant_1129249" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="6434"> <dim>1</dim> </port> </output> </layer> <layer id="6022" name="__module.model.layers.38.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6435,variance.155"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6023" name="Constant_1176219" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6024" name="__module.model.layers.38.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6436"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6025" name="__module.model.layers.38.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6026" name="__module.model.layers.38.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6437"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6027" name="__module.model.layers.38.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6438,6439,hidden_states.1163,hidden_states.1165"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6028" name="__module.model.layers.38.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6440,6442"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6029" name="self.model.layers.38.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="9460839184" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6030" name="Convert_1229492" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6031" name="self.model.layers.38.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="9531618064" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6032" name="Convert_1229495" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6033" name="self.model.layers.38.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6034" name="self.model.layers.38.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="9531641104" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6035" name="self.model.layers.38.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6036" name="__module.model.layers.38.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6037" name="__module.model.layers.38.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6448,input.77"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6038" name="__module.model.layers.38.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="6449"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6039" name="self.model.layers.38.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="9531687184" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6040" name="Convert_1229482" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6041" name="self.model.layers.38.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="9602466064" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6042" name="Convert_1229485" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6043" name="self.model.layers.38.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6044" name="self.model.layers.38.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="9602489104" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6045" name="self.model.layers.38.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6046" name="__module.model.layers.38.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6047" name="__module.model.layers.38.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6451"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6048" name="__module.model.layers.38.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="6452"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6049" name="self.model.layers.38.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="9602535184" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6050" name="Convert_1229502" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6051" name="self.model.layers.38.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="9673314064" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6052" name="Convert_1229505" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6053" name="self.model.layers.38.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6054" name="self.model.layers.38.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="9673317136" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6055" name="self.model.layers.38.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6056" name="__module.model.layers.38.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6057" name="__module.model.layers.38.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="6454,hidden_states.1167"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6058" name="__module.model.layers.38/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6455,6457,6465,6476,hidden_states.1169,hidden_states.1171"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6059" name="Constant_1176224" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6060" name="Constant_1176222" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6061" name="__module.model.layers.39.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6466"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6062" name="Constant_1129323" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="6467"> <dim>1</dim> </port> </output> </layer> <layer id="6063" name="__module.model.layers.39.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6468,variance.157"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6064" name="Constant_1176223" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6065" name="__module.model.layers.39.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6469"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6066" name="__module.model.layers.39.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6067" name="__module.model.layers.39.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6470"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6068" name="__module.model.layers.39.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6471,6472,hidden_states.1173,hidden_states.1175"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6069" name="__module.model.layers.39.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6473,6475,hidden_states.1177"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6070" name="self.model.layers.39.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="9673323280" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6071" name="Convert_1231122" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6072" name="self.model.layers.39.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="9676469008" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="6073" name="Convert_1231125" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="6074" name="self.model.layers.39.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6075" name="self.model.layers.39.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="9676470032" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="6076" name="self.model.layers.39.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6077" name="__module.model.layers.39.self_attn.v_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6078" name="__module.model.layers.39.self_attn.v_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6488,value_states"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="6079" name="Constant_1187912" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="6080" name="__module.model.layers.39.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6496"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="6081" name="__module.model.layers.39.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="6082" name="__module.model.layers.39.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6497"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6083" name="__module.model.layers.39.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6557,6558,hidden_states.1183,present.39.value"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6085" name="ReadValue_1190192" type="ReadValue" version="opset6"> <data variable_id="past_key_values.39.keypresent.39.key" variable_type="f32" variable_shape="?,4,?,256" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>0</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.39.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6086" name="Constant_1189609" type="Const" version="opset1"> <data element_type="i64" shape="" offset="4" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="6087" name="Gather_1189610" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6088" name="self.model.layers.39.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="1024, 3072" offset="9676472080" size="3145728" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6089" name="Convert_1231132" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6090" name="self.model.layers.39.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="1024, 1" offset="9679617808" size="1024" /> <output> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="6091" name="Convert_1231135" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="6092" name="self.model.layers.39.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6093" name="self.model.layers.39.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 1" offset="9679618832" size="2048" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </output> </layer> <layer id="6094" name="self.model.layers.39.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6095" name="__module.model.layers.39.self_attn.k_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6096" name="__module.model.layers.39.self_attn.k_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6486,key_states.161"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="6097" name="Constant_1187913" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666832" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="6098" name="__module.model.layers.39.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6493"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> </output> </layer> <layer id="6099" name="__module.model.layers.39.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="6100" name="__module.model.layers.39.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6494,k"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6101" name="__module.model.layers.39.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6516"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6102" name="Constant_1129863" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6103" name="Constant_1129865" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6104" name="Constant_1129867" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6105" name="__module.model.layers.39.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6526,x2"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="6106" name="Constant_1176226" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6107" name="__module.model.layers.39.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6527"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="6108" name="Constant_1129760" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6109" name="Constant_1129804" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6110" name="Constant_1129806" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6111" name="__module.model.layers.39.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6521"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="6112" name="__module.model.layers.39.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="6529"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6113" name="__module.model.layers.39.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6530"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6114" name="__module.model.layers.39.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6531"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6115" name="__module.model.layers.39.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6541,6542,hidden_states.1179,present.39.key"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6183" name="Constant_1176235" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="9679620880" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6184" name="self.model.layers.39.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="9679633168" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6185" name="Convert_1230322" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6186" name="self.model.layers.39.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="9689070352" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6187" name="Convert_1230325" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6188" name="self.model.layers.39.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6189" name="self.model.layers.39.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="9689073424" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6190" name="self.model.layers.39.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6191" name="__module.model.layers.39.self_attn.q_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6192" name="__module.model.layers.39.self_attn.q_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6484,query_states"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6193" name="Constant_1187914" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="412517424" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="6194" name="__module.model.layers.39.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6490"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="6195" name="__module.model.layers.39.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="6196" name="__module.model.layers.39.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6491,q"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6197" name="__module.model.layers.39.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6500"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6198" name="Constant_1129720" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6199" name="Constant_1129722" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518012" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6200" name="Constant_1129724" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6201" name="__module.model.layers.39.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6510,x2.157"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="6202" name="Constant_1176227" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1, 1" offset="412518028" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6203" name="__module.model.layers.39.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6511"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="6204" name="Constant_1129617" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="4" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6205" name="Constant_1129661" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412518004" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6206" name="Constant_1129663" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="412517984" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="6207" name="__module.model.layers.39.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="6505"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </output> </layer> <layer id="6208" name="__module.model.layers.39.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>128</dim> </port> </input> <output> <port id="2" precision="FP32" names="6513"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6209" name="__module.model.layers.39.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6514"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6210" name="__module.model.layers.39.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="2" precision="FP32" names="6515"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6211" name="__module.model.layers.39.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="6543,6544,6545"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6212" name="__module.model.layers.39.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="6547,hidden_states.1181"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6213" name="Constant_1187915" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="6214" name="__module.model.layers.39.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6551,key_states"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6215" name="__module.model.layers.39.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="6559,6560,6561"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6216" name="__module.model.layers.39.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>1</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>5</dim> </port> </input> <output> <port id="2" precision="FP32" names="6563,hidden_states.1185"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6217" name="Constant_1187916" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="415666888" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="6218" name="__module.model.layers.39.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>3</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6567"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6219" name="__module.model.layers.39.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="6573,attn_output.157"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6220" name="__module.model.layers.39.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="412517456" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="6221" name="__module.model.layers.39.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>12</dim> <dim>-1</dim> <dim>256</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="6574"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> </output> </layer> <layer id="6222" name="__module.model.layers.39.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>12</dim> <dim>256</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="6577"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="6223" name="self.model.layers.39.self_attn.o_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 3072" offset="9689079568" size="9437184" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6224" name="Convert_1230332" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6225" name="self.model.layers.39.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="9698516752" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6226" name="Convert_1230335" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6227" name="self.model.layers.39.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6228" name="self.model.layers.39.self_attn.o_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="9698519824" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6229" name="self.model.layers.39.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6230" name="__module.model.layers.39.self_attn.o_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6231" name="__module.model.layers.39.self_attn.o_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6579,6581,hidden_states.1187"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6232" name="__module.model.layers.39/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6584,6586,6597,hidden_states.1189,hidden_states.1191"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6233" name="Constant_1176231" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 3072" offset="9698525968" size="12288" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6234" name="Constant_1176230" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6235" name="Constant_1176228" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6236" name="__module.model.layers.39.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6587"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6237" name="Constant_1130466" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="6588"> <dim>1</dim> </port> </output> </layer> <layer id="6238" name="__module.model.layers.39.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6589,variance.159"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6239" name="Constant_1176229" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6240" name="__module.model.layers.39.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6590"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6241" name="__module.model.layers.39.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6242" name="__module.model.layers.39.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6591"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6243" name="__module.model.layers.39.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6592,6593,hidden_states.1193,hidden_states.1195"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6244" name="__module.model.layers.39.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6594,6596"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6245" name="self.model.layers.39.mlp.gate_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="9698538256" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6246" name="Convert_1229522" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6247" name="self.model.layers.39.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="9769317136" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6248" name="Convert_1229525" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6249" name="self.model.layers.39.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6250" name="self.model.layers.39.mlp.gate_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="9769340176" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6251" name="self.model.layers.39.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6252" name="__module.model.layers.39.mlp.gate_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6253" name="__module.model.layers.39.mlp.gate_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6602,input"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6254" name="__module.model.layers.39.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32" names="6603"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6255" name="self.model.layers.39.mlp.up_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="23040, 3072" offset="9769386256" size="70778880" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6256" name="Convert_1229512" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6257" name="self.model.layers.39.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="23040, 1" offset="9840165136" size="23040" /> <output> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6258" name="Convert_1229515" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6259" name="self.model.layers.39.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6260" name="self.model.layers.39.mlp.up_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="23040, 1" offset="9840188176" size="46080" /> <output> <port id="0" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </output> </layer> <layer id="6261" name="self.model.layers.39.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>23040</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6262" name="__module.model.layers.39.mlp.up_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6263" name="__module.model.layers.39.mlp.up_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>23040</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6605"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6264" name="__module.model.layers.39.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="6606"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6265" name="self.model.layers.39.mlp.down_proj.weight" type="Const" version="opset1"> <data element_type="u8" shape="3072, 23040" offset="9840234256" size="70778880" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6266" name="Convert_1229532" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6267" name="self.model.layers.39.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="3072, 1" offset="9911013136" size="3072" /> <output> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6268" name="Convert_1229535" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6269" name="self.model.layers.39.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6270" name="self.model.layers.39.mlp.down_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="3072, 1" offset="9911016208" size="6144" /> <output> <port id="0" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6271" name="self.model.layers.39.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> <port id="1" precision="FP16"> <dim>3072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6272" name="__module.model.layers.39.mlp.down_proj/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </output> </layer> <layer id="6273" name="__module.model.layers.39.mlp.down_proj/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>23040</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>23040</dim> </port> </input> <output> <port id="2" precision="FP32" names="6608,hidden_states.1197"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6274" name="__module.model.layers.39/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="6609,6611,6615,hidden_states.1199,hidden_states.1201"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6275" name="Constant_1176234" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071004" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6276" name="Constant_1176232" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071008" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6277" name="__module.model.norm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6616"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6278" name="Constant_1130536" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="403071012" size="8" /> <output> <port id="0" precision="I64" names="6617"> <dim>1</dim> </port> </output> </layer> <layer id="6279" name="__module.model.norm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6618,variance"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6280" name="Constant_1176233" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1" offset="403071020" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6281" name="__module.model.norm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6619"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6282" name="__module.model.norm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6283" name="__module.model.norm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6620"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="6284" name="__module.model.norm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="6621,6622,hidden_states.1203,hidden_states.1205"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6285" name="__module.model.norm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="128,213,218,223,6623,hidden_states"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6286" name="self.lm_head.weight" type="Const" version="opset1"> <data element_type="u8" shape="131072, 3072" offset="9911022352" size="402653184" /> <output> <port id="0" precision="U8"> <dim>131072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6287" name="Convert_1228332" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>131072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6288" name="self.lm_head.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="131072, 1" offset="10313675536" size="131072" /> <output> <port id="0" precision="U8"> <dim>131072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6289" name="Convert_1228335" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>131072</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>131072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6290" name="self.lm_head.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>131072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6291" name="self.lm_head.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="131072, 1" offset="10313806608" size="262144" /> <output> <port id="0" precision="FP16"> <dim>131072</dim> <dim>1</dim> </port> </output> </layer> <layer id="6292" name="self.lm_head.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> <port id="1" precision="FP16"> <dim>131072</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6293" name="__module.lm_head/ov_ext::linear/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>131072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>131072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="6294" name="__module.lm_head/ov_ext::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>131072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="logits"> <dim>-1</dim> <dim>-1</dim> <dim>131072</dim> </port> </output> </layer> <layer id="6182" name="Assign_1190061" type="Assign" version="opset6"> <data variable_id="past_key_values.0.keypresent.0.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6181" name="Assign_1190063" type="Assign" version="opset6"> <data variable_id="past_key_values.0.valuepresent.0.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6180" name="Assign_1190065" type="Assign" version="opset6"> <data variable_id="past_key_values.1.keypresent.1.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6179" name="Assign_1190067" type="Assign" version="opset6"> <data variable_id="past_key_values.1.valuepresent.1.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6178" name="Assign_1190069" type="Assign" version="opset6"> <data variable_id="past_key_values.10.keypresent.10.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6177" name="Assign_1190071" type="Assign" version="opset6"> <data variable_id="past_key_values.10.valuepresent.10.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6176" name="Assign_1190073" type="Assign" version="opset6"> <data variable_id="past_key_values.11.keypresent.11.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6175" name="Assign_1190075" type="Assign" version="opset6"> <data variable_id="past_key_values.11.valuepresent.11.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6174" name="Assign_1190077" type="Assign" version="opset6"> <data variable_id="past_key_values.12.keypresent.12.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6173" name="Assign_1190079" type="Assign" version="opset6"> <data variable_id="past_key_values.12.valuepresent.12.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6172" name="Assign_1190081" type="Assign" version="opset6"> <data variable_id="past_key_values.13.keypresent.13.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6171" name="Assign_1190083" type="Assign" version="opset6"> <data variable_id="past_key_values.13.valuepresent.13.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6170" name="Assign_1190085" type="Assign" version="opset6"> <data variable_id="past_key_values.14.keypresent.14.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6169" name="Assign_1190087" type="Assign" version="opset6"> <data variable_id="past_key_values.14.valuepresent.14.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6168" name="Assign_1190089" type="Assign" version="opset6"> <data variable_id="past_key_values.15.keypresent.15.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6167" name="Assign_1190091" type="Assign" version="opset6"> <data variable_id="past_key_values.15.valuepresent.15.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6166" name="Assign_1190093" type="Assign" version="opset6"> <data variable_id="past_key_values.16.keypresent.16.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6165" name="Assign_1190095" type="Assign" version="opset6"> <data variable_id="past_key_values.16.valuepresent.16.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6164" name="Assign_1190097" type="Assign" version="opset6"> <data variable_id="past_key_values.17.keypresent.17.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6163" name="Assign_1190099" type="Assign" version="opset6"> <data variable_id="past_key_values.17.valuepresent.17.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6162" name="Assign_1190101" type="Assign" version="opset6"> <data variable_id="past_key_values.18.keypresent.18.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6161" name="Assign_1190103" type="Assign" version="opset6"> <data variable_id="past_key_values.18.valuepresent.18.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6160" name="Assign_1190105" type="Assign" version="opset6"> <data variable_id="past_key_values.19.keypresent.19.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6159" name="Assign_1190107" type="Assign" version="opset6"> <data variable_id="past_key_values.19.valuepresent.19.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6158" name="Assign_1190109" type="Assign" version="opset6"> <data variable_id="past_key_values.2.keypresent.2.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6157" name="Assign_1190111" type="Assign" version="opset6"> <data variable_id="past_key_values.2.valuepresent.2.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6156" name="Assign_1190113" type="Assign" version="opset6"> <data variable_id="past_key_values.20.keypresent.20.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6155" name="Assign_1190115" type="Assign" version="opset6"> <data variable_id="past_key_values.20.valuepresent.20.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6154" name="Assign_1190117" type="Assign" version="opset6"> <data variable_id="past_key_values.21.keypresent.21.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6153" name="Assign_1190119" type="Assign" version="opset6"> <data variable_id="past_key_values.21.valuepresent.21.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6152" name="Assign_1190121" type="Assign" version="opset6"> <data variable_id="past_key_values.22.keypresent.22.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6151" name="Assign_1190123" type="Assign" version="opset6"> <data variable_id="past_key_values.22.valuepresent.22.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6150" name="Assign_1190125" type="Assign" version="opset6"> <data variable_id="past_key_values.23.keypresent.23.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6149" name="Assign_1190127" type="Assign" version="opset6"> <data variable_id="past_key_values.23.valuepresent.23.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6148" name="Assign_1190129" type="Assign" version="opset6"> <data variable_id="past_key_values.24.keypresent.24.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6147" name="Assign_1190131" type="Assign" version="opset6"> <data variable_id="past_key_values.24.valuepresent.24.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6146" name="Assign_1190133" type="Assign" version="opset6"> <data variable_id="past_key_values.25.keypresent.25.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6145" name="Assign_1190135" type="Assign" version="opset6"> <data variable_id="past_key_values.25.valuepresent.25.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6144" name="Assign_1190137" type="Assign" version="opset6"> <data variable_id="past_key_values.26.keypresent.26.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6143" name="Assign_1190139" type="Assign" version="opset6"> <data variable_id="past_key_values.26.valuepresent.26.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6142" name="Assign_1190141" type="Assign" version="opset6"> <data variable_id="past_key_values.27.keypresent.27.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6141" name="Assign_1190143" type="Assign" version="opset6"> <data variable_id="past_key_values.27.valuepresent.27.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6140" name="Assign_1190145" type="Assign" version="opset6"> <data variable_id="past_key_values.28.keypresent.28.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6139" name="Assign_1190147" type="Assign" version="opset6"> <data variable_id="past_key_values.28.valuepresent.28.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6138" name="Assign_1190149" type="Assign" version="opset6"> <data variable_id="past_key_values.29.keypresent.29.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6137" name="Assign_1190151" type="Assign" version="opset6"> <data variable_id="past_key_values.29.valuepresent.29.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6136" name="Assign_1190153" type="Assign" version="opset6"> <data variable_id="past_key_values.3.keypresent.3.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6135" name="Assign_1190155" type="Assign" version="opset6"> <data variable_id="past_key_values.3.valuepresent.3.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6134" name="Assign_1190157" type="Assign" version="opset6"> <data variable_id="past_key_values.30.keypresent.30.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6133" name="Assign_1190159" type="Assign" version="opset6"> <data variable_id="past_key_values.30.valuepresent.30.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6132" name="Assign_1190161" type="Assign" version="opset6"> <data variable_id="past_key_values.31.keypresent.31.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6131" name="Assign_1190163" type="Assign" version="opset6"> <data variable_id="past_key_values.31.valuepresent.31.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6130" name="Assign_1190165" type="Assign" version="opset6"> <data variable_id="past_key_values.32.keypresent.32.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6129" name="Assign_1190167" type="Assign" version="opset6"> <data variable_id="past_key_values.32.valuepresent.32.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6128" name="Assign_1190169" type="Assign" version="opset6"> <data variable_id="past_key_values.33.keypresent.33.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6127" name="Assign_1190171" type="Assign" version="opset6"> <data variable_id="past_key_values.33.valuepresent.33.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6126" name="Assign_1190173" type="Assign" version="opset6"> <data variable_id="past_key_values.34.keypresent.34.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6125" name="Assign_1190175" type="Assign" version="opset6"> <data variable_id="past_key_values.34.valuepresent.34.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6124" name="Assign_1190177" type="Assign" version="opset6"> <data variable_id="past_key_values.35.keypresent.35.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6123" name="Assign_1190179" type="Assign" version="opset6"> <data variable_id="past_key_values.35.valuepresent.35.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6122" name="Assign_1190181" type="Assign" version="opset6"> <data variable_id="past_key_values.36.keypresent.36.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6121" name="Assign_1190183" type="Assign" version="opset6"> <data variable_id="past_key_values.36.valuepresent.36.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6120" name="Assign_1190185" type="Assign" version="opset6"> <data variable_id="past_key_values.37.keypresent.37.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6119" name="Assign_1190187" type="Assign" version="opset6"> <data variable_id="past_key_values.37.valuepresent.37.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6118" name="Assign_1190189" type="Assign" version="opset6"> <data variable_id="past_key_values.38.keypresent.38.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6117" name="Assign_1190191" type="Assign" version="opset6"> <data variable_id="past_key_values.38.valuepresent.38.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6116" name="Assign_1190193" type="Assign" version="opset6"> <data variable_id="past_key_values.39.keypresent.39.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6084" name="Assign_1190195" type="Assign" version="opset6"> <data variable_id="past_key_values.39.valuepresent.39.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1584" name="Assign_1190197" type="Assign" version="opset6"> <data variable_id="past_key_values.4.keypresent.4.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1583" name="Assign_1190199" type="Assign" version="opset6"> <data variable_id="past_key_values.4.valuepresent.4.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1582" name="Assign_1190201" type="Assign" version="opset6"> <data variable_id="past_key_values.5.keypresent.5.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1581" name="Assign_1190203" type="Assign" version="opset6"> <data variable_id="past_key_values.5.valuepresent.5.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1580" name="Assign_1190205" type="Assign" version="opset6"> <data variable_id="past_key_values.6.keypresent.6.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1579" name="Assign_1190207" type="Assign" version="opset6"> <data variable_id="past_key_values.6.valuepresent.6.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1578" name="Assign_1190209" type="Assign" version="opset6"> <data variable_id="past_key_values.7.keypresent.7.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1577" name="Assign_1190211" type="Assign" version="opset6"> <data variable_id="past_key_values.7.valuepresent.7.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1576" name="Assign_1190213" type="Assign" version="opset6"> <data variable_id="past_key_values.8.keypresent.8.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1575" name="Assign_1190215" type="Assign" version="opset6"> <data variable_id="past_key_values.8.valuepresent.8.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1574" name="Assign_1190217" type="Assign" version="opset6"> <data variable_id="past_key_values.9.keypresent.9.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="1542" name="Assign_1190219" type="Assign" version="opset6"> <data variable_id="past_key_values.9.valuepresent.9.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>4</dim> <dim>-1</dim> <dim>256</dim> </port> </output> </layer> <layer id="6295" name="Result_1131373" type="Result" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>131072</dim> </port> </input> </layer> </layers> <edges> <edge from-layer="0" from-port="0" to-layer="1872" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2209" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="6087" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2174" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3986" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2058" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5984" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2023" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4021" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1907" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5949" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2325" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4137" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1756" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5833" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1721" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5798" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1587" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4172" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1545" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3382" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3080" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2929" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3719" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2813" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3835" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3684" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2778" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2964" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2662" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3568" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1442" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2627" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3533" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3870" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2511" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3115" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2476" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3417" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2360" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="91" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="16" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="687" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1407" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="652" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5380" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="536" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4625" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="501" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5345" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="385" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="146" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4590" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="350" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4741" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4776" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3266" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5229" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4892" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5194" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4927" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5078" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5043" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="803" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5682" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1291" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4288" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1256" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5647" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1140" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4323" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1105" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3231" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="989" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4439" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="954" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5531" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="838" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4474" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="5496" to-port="1" /> <edge from-layer="1" from-port="0" to-layer="64" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="231" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="168" to-port="0" /> <edge from-layer="3" from-port="0" to-layer="5" to-port="0" /> <edge from-layer="3" from-port="0" to-layer="26" to-port="0" /> <edge from-layer="4" from-port="0" to-layer="13" to-port="0" /> <edge from-layer="5" from-port="1" to-layer="8" to-port="0" /> <edge from-layer="6" from-port="0" to-layer="8" to-port="1" /> <edge from-layer="7" from-port="0" to-layer="8" to-port="2" /> <edge from-layer="8" from-port="3" to-layer="12" to-port="0" /> <edge from-layer="9" from-port="0" to-layer="12" to-port="1" /> <edge from-layer="10" from-port="0" to-layer="12" to-port="2" /> <edge from-layer="11" from-port="0" to-layer="12" to-port="3" /> <edge from-layer="12" from-port="4" to-layer="13" to-port="1" /> <edge from-layer="13" from-port="2" to-layer="685" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="383" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5494" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="801" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="836" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5529" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="952" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="987" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1103" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5645" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3229" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1138" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="650" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5378" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="534" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="499" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1254" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="348" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="144" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3264" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5227" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5192" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5076" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5343" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2021" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2962" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2811" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2776" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3078" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2660" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2625" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3113" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2509" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2474" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2358" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2323" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2207" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2172" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="6085" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2056" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="2927" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5982" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1905" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5947" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1870" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1754" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5831" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1719" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1585" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5796" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1543" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1440" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1405" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="1289" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5680" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4135" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4588" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3566" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4472" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4437" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4321" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3380" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4286" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4170" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="5041" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3682" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4019" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3717" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3984" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3833" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3415" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="89" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3868" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4925" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4623" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4890" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="14" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="3531" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4739" to-port="0" /> <edge from-layer="13" from-port="2" to-layer="4774" to-port="0" /> <edge from-layer="14" from-port="1" to-layer="16" to-port="0" /> <edge from-layer="15" from-port="0" to-layer="16" to-port="2" /> <edge from-layer="16" from-port="3" to-layer="1541" to-port="0" /> <edge from-layer="17" from-port="0" to-layer="1527" to-port="0" /> <edge from-layer="18" from-port="0" to-layer="19" to-port="0" /> <edge from-layer="19" from-port="1" to-layer="22" to-port="0" /> <edge from-layer="20" from-port="0" to-layer="21" to-port="0" /> <edge from-layer="21" from-port="1" to-layer="22" to-port="1" /> <edge from-layer="22" from-port="2" to-layer="24" to-port="0" /> <edge from-layer="23" from-port="0" to-layer="24" to-port="1" /> <edge from-layer="24" from-port="2" to-layer="25" to-port="0" /> <edge from-layer="25" from-port="1" to-layer="28" to-port="0" /> <edge from-layer="26" from-port="1" to-layer="28" to-port="1" /> <edge from-layer="27" from-port="0" to-layer="28" to-port="2" /> <edge from-layer="28" from-port="3" to-layer="266" to-port="0" /> <edge from-layer="28" from-port="3" to-layer="39" to-port="0" /> <edge from-layer="28" from-port="3" to-layer="32" to-port="0" /> <edge from-layer="29" from-port="0" to-layer="40" to-port="0" /> <edge from-layer="30" from-port="0" to-layer="38" to-port="0" /> <edge from-layer="31" from-port="0" to-layer="32" to-port="1" /> <edge from-layer="32" from-port="2" to-layer="34" to-port="0" /> <edge from-layer="33" from-port="0" to-layer="34" to-port="1" /> <edge from-layer="34" from-port="2" to-layer="36" to-port="0" /> <edge from-layer="35" from-port="0" to-layer="36" to-port="1" /> <edge from-layer="36" from-port="2" to-layer="37" to-port="0" /> <edge from-layer="37" from-port="1" to-layer="38" to-port="1" /> <edge from-layer="38" from-port="2" to-layer="39" to-port="1" /> <edge from-layer="39" from-port="2" to-layer="40" to-port="1" /> <edge from-layer="40" from-port="2" to-layer="55" to-port="0" /> <edge from-layer="40" from-port="2" to-layer="49" to-port="0" /> <edge from-layer="40" from-port="2" to-layer="100" to-port="0" /> <edge from-layer="40" from-port="2" to-layer="155" to-port="0" /> <edge from-layer="41" from-port="0" to-layer="42" to-port="0" /> <edge from-layer="42" from-port="1" to-layer="45" to-port="0" /> <edge from-layer="43" from-port="0" to-layer="44" to-port="0" /> <edge from-layer="44" from-port="1" to-layer="45" to-port="1" /> <edge from-layer="45" from-port="2" to-layer="47" to-port="0" /> <edge from-layer="46" from-port="0" to-layer="47" to-port="1" /> <edge from-layer="47" from-port="2" to-layer="48" to-port="0" /> <edge from-layer="48" from-port="1" to-layer="49" to-port="1" /> <edge from-layer="49" from-port="2" to-layer="51" to-port="0" /> <edge from-layer="50" from-port="0" to-layer="51" to-port="1" /> <edge from-layer="51" from-port="2" to-layer="53" to-port="0" /> <edge from-layer="52" from-port="0" to-layer="53" to-port="1" /> <edge from-layer="53" from-port="2" to-layer="72" to-port="0" /> <edge from-layer="53" from-port="2" to-layer="83" to-port="0" /> <edge from-layer="53" from-port="2" to-layer="77" to-port="0" /> <edge from-layer="54" from-port="0" to-layer="62" to-port="0" /> <edge from-layer="55" from-port="1" to-layer="253" to-port="0" /> <edge from-layer="55" from-port="1" to-layer="135" to-port="0" /> <edge from-layer="55" from-port="1" to-layer="58" to-port="0" /> <edge from-layer="56" from-port="0" to-layer="58" to-port="1" /> <edge from-layer="57" from-port="0" to-layer="58" to-port="2" /> <edge from-layer="58" from-port="3" to-layer="213" to-port="0" /> <edge from-layer="58" from-port="3" to-layer="61" to-port="0" /> <edge from-layer="59" from-port="0" to-layer="61" to-port="1" /> <edge from-layer="60" from-port="0" to-layer="61" to-port="2" /> <edge from-layer="61" from-port="3" to-layer="62" to-port="1" /> <edge from-layer="62" from-port="2" to-layer="66" to-port="0" /> <edge from-layer="63" from-port="0" to-layer="64" to-port="1" /> <edge from-layer="63" from-port="0" to-layer="209" to-port="1" /> <edge from-layer="63" from-port="0" to-layer="71" to-port="1" /> <edge from-layer="63" from-port="0" to-layer="86" to-port="1" /> <edge from-layer="63" from-port="0" to-layer="231" to-port="1" /> <edge from-layer="64" from-port="2" to-layer="65" to-port="0" /> <edge from-layer="65" from-port="1" to-layer="66" to-port="1" /> <edge from-layer="66" from-port="2" to-layer="68" to-port="0" /> <edge from-layer="67" from-port="0" to-layer="68" to-port="1" /> <edge from-layer="68" from-port="2" to-layer="69" to-port="0" /> <edge from-layer="68" from-port="2" to-layer="69" to-port="1" /> <edge from-layer="69" from-port="2" to-layer="85" to-port="0" /> <edge from-layer="69" from-port="2" to-layer="70" to-port="0" /> <edge from-layer="70" from-port="1" to-layer="71" to-port="0" /> <edge from-layer="71" from-port="2" to-layer="4302" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5510" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3245" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4453" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="817" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5631" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3366" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="938" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4423" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5661" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="968" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5480" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5782" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1089" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3215" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4272" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1119" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5812" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3396" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4755" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="334" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5178" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5027" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="364" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5208" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4906" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5329" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="485" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4876" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="787" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="515" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3517" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4725" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="636" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5359" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4604" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="666" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1270" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4574" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2611" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1602" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1705" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2792" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2762" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1735" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3668" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2641" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1856" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3547" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3698" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1886" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2490" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2007" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2460" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2037" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2339" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2158" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5057" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2309" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="6197" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4151" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5933" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2188" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="5963" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4121" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1391" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4000" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="6101" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1421" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1240" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3970" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3094" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3849" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3064" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2943" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3819" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1559" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2913" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="105" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="72" to-port="1" /> <edge from-layer="72" from-port="2" to-layer="88" to-port="0" /> <edge from-layer="73" from-port="0" to-layer="77" to-port="1" /> <edge from-layer="74" from-port="0" to-layer="77" to-port="2" /> <edge from-layer="75" from-port="0" to-layer="77" to-port="3" /> <edge from-layer="76" from-port="0" to-layer="6105" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="6201" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4306" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="640" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4312" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3376" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="109" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3370" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="6111" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="646" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4427" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4433" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4457" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4463" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2198" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="115" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2011" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4578" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4584" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2192" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2017" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4010" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3068" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3074" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3853" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3859" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3098" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="368" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3104" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3974" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3980" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4004" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="374" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="6207" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="676" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3406" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="670" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4125" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4131" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3400" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4155" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4161" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4276" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4282" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4608" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5363" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2162" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="525" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5188" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3219" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="519" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5212" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5218" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5333" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5339" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3225" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5671" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5665" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5786" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5369" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="495" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="489" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3255" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5641" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5635" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5484" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5490" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3249" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5514" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5520" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4886" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4614" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4729" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5973" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5967" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4735" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4759" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4765" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5943" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5937" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2041" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2047" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4880" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="942" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4910" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4916" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5031" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5037" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5822" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5816" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5061" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2168" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5067" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5792" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="5182" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1860" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2645" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2651" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1250" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1709" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1715" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1244" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="225" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1739" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1745" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1129" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1612" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1866" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1123" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2766" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2772" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3521" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2796" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2313" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2802" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3551" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="797" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2494" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2500" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1395" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1401" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="821" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1425" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1431" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1280" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1274" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2470" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3527" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="230" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1563" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2464" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1569" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2615" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2621" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="791" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="827" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1606" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1099" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="247" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2947" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="972" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="978" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3702" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2953" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1896" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2319" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3678" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2923" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3708" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2343" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="344" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2917" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="83" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1093" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="338" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3557" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3829" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="77" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3823" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1890" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2349" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3672" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="948" to-port="4" /> <edge from-layer="77" from-port="5" to-layer="79" to-port="0" /> <edge from-layer="78" from-port="0" to-layer="79" to-port="1" /> <edge from-layer="79" from-port="2" to-layer="84" to-port="0" /> <edge from-layer="80" from-port="0" to-layer="83" to-port="1" /> <edge from-layer="81" from-port="0" to-layer="83" to-port="2" /> <edge from-layer="82" from-port="0" to-layer="83" to-port="3" /> <edge from-layer="83" from-port="5" to-layer="84" to-port="1" /> <edge from-layer="84" from-port="2" to-layer="87" to-port="0" /> <edge from-layer="85" from-port="1" to-layer="86" to-port="0" /> <edge from-layer="86" from-port="2" to-layer="1282" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1101" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5522" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="497" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5069" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5371" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="527" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2321" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5190" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5341" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3257" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1131" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5492" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5220" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="980" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="829" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="950" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1252" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3408" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3529" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4314" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3378" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3559" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4284" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="648" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4163" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4133" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3680" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1868" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="678" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4012" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3982" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1898" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3710" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="87" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3861" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3831" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4616" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1403" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4918" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1433" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2049" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4888" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="799" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4767" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4737" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1571" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5039" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2019" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1614" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="117" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4586" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1717" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="1747" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4465" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="4435" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2200" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3227" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2774" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5673" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2653" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2623" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2804" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2925" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5643" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5975" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="346" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2955" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2502" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="6113" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2472" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5824" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2170" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3076" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="3106" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="2351" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5945" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="376" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="6209" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="5794" to-port="1" /> <edge from-layer="87" from-port="2" to-layer="88" to-port="1" /> <edge from-layer="88" from-port="2" to-layer="248" to-port="0" /> <edge from-layer="89" from-port="1" to-layer="91" to-port="0" /> <edge from-layer="90" from-port="0" to-layer="91" to-port="2" /> <edge from-layer="91" from-port="3" to-layer="127" to-port="0" /> <edge from-layer="91" from-port="3" to-layer="119" to-port="0" /> <edge from-layer="92" from-port="0" to-layer="93" to-port="0" /> <edge from-layer="93" from-port="1" to-layer="96" to-port="0" /> <edge from-layer="94" from-port="0" to-layer="95" to-port="0" /> <edge from-layer="95" from-port="1" to-layer="96" to-port="1" /> <edge from-layer="96" from-port="2" to-layer="98" to-port="0" /> <edge from-layer="97" from-port="0" to-layer="98" to-port="1" /> <edge from-layer="98" from-port="2" to-layer="99" to-port="0" /> <edge from-layer="99" from-port="1" to-layer="100" to-port="1" /> <edge from-layer="100" from-port="2" to-layer="102" to-port="0" /> <edge from-layer="101" from-port="0" to-layer="102" to-port="1" /> <edge from-layer="102" from-port="2" to-layer="104" to-port="0" /> <edge from-layer="103" from-port="0" to-layer="104" to-port="1" /> <edge from-layer="104" from-port="2" to-layer="115" to-port="0" /> <edge from-layer="104" from-port="2" to-layer="109" to-port="0" /> <edge from-layer="104" from-port="2" to-layer="105" to-port="0" /> <edge from-layer="105" from-port="2" to-layer="118" to-port="0" /> <edge from-layer="106" from-port="0" to-layer="109" to-port="1" /> <edge from-layer="107" from-port="0" to-layer="109" to-port="2" /> <edge from-layer="108" from-port="0" to-layer="109" to-port="3" /> <edge from-layer="109" from-port="5" to-layer="111" to-port="0" /> <edge from-layer="110" from-port="0" to-layer="111" to-port="1" /> <edge from-layer="111" from-port="2" to-layer="116" to-port="0" /> <edge from-layer="112" from-port="0" to-layer="115" to-port="1" /> <edge from-layer="113" from-port="0" to-layer="115" to-port="2" /> <edge from-layer="114" from-port="0" to-layer="115" to-port="3" /> <edge from-layer="115" from-port="5" to-layer="116" to-port="1" /> <edge from-layer="116" from-port="2" to-layer="117" to-port="0" /> <edge from-layer="117" from-port="2" to-layer="118" to-port="1" /> <edge from-layer="118" from-port="2" to-layer="119" to-port="1" /> <edge from-layer="119" from-port="2" to-layer="6182" to-port="0" /> <edge from-layer="119" from-port="2" to-layer="122" to-port="0" /> <edge from-layer="119" from-port="2" to-layer="121" to-port="0" /> <edge from-layer="120" from-port="0" to-layer="4489" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4468" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5999" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="6215" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4791" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="6211" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5525" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="400" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5978" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4770" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4619" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4640" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4338" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2203" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="121" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4317" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2505" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2807" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1771" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1750" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2677" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2656" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1620" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1616" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="232" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1457" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1436" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2526" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3562" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1306" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1285" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="832" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1155" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1134" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2375" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2354" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1004" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="853" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="983" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3864" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4166" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="379" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2224" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4036" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4015" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3130" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3411" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="681" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3109" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3885" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4187" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="702" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1922" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3432" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2979" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3734" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="1901" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3713" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2958" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3583" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2828" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5697" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3281" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2052" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5395" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="2073" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5072" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5374" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4921" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="161" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5093" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="3260" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5223" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5676" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5827" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="4942" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="551" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5244" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5546" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="530" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="5848" to-port="1" /> <edge from-layer="121" from-port="2" to-layer="141" to-port="0" /> <edge from-layer="122" from-port="1" to-layer="125" to-port="0" /> <edge from-layer="123" from-port="0" to-layer="125" to-port="1" /> <edge from-layer="124" from-port="0" to-layer="125" to-port="2" /> <edge from-layer="125" from-port="3" to-layer="140" to-port="0" /> <edge from-layer="126" from-port="0" to-layer="140" to-port="1" /> <edge from-layer="127" from-port="1" to-layer="130" to-port="0" /> <edge from-layer="128" from-port="0" to-layer="130" to-port="1" /> <edge from-layer="129" from-port="0" to-layer="130" to-port="2" /> <edge from-layer="130" from-port="3" to-layer="201" to-port="0" /> <edge from-layer="130" from-port="3" to-layer="199" to-port="0" /> <edge from-layer="130" from-port="3" to-layer="132" to-port="0" /> <edge from-layer="131" from-port="0" to-layer="132" to-port="1" /> <edge from-layer="132" from-port="2" to-layer="138" to-port="0" /> <edge from-layer="133" from-port="0" to-layer="135" to-port="1" /> <edge from-layer="134" from-port="0" to-layer="135" to-port="2" /> <edge from-layer="135" from-port="3" to-layer="137" to-port="0" /> <edge from-layer="135" from-port="3" to-layer="199" to-port="1" /> <edge from-layer="136" from-port="0" to-layer="137" to-port="1" /> <edge from-layer="137" from-port="2" to-layer="174" to-port="0" /> <edge from-layer="137" from-port="2" to-layer="138" to-port="1" /> <edge from-layer="138" from-port="2" to-layer="140" to-port="2" /> <edge from-layer="138" from-port="2" to-layer="247" to-port="2" /> <edge from-layer="139" from-port="0" to-layer="140" to-port="3" /> <edge from-layer="140" from-port="4" to-layer="4016" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5677" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1923" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="6216" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3865" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5224" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3886" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="162" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="380" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3110" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5698" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5094" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3412" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="682" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4037" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2225" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3282" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3131" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1156" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1617" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2527" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1458" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1437" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5396" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2506" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1307" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1286" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2376" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5375" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="833" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5547" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1135" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2355" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1005" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="854" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="984" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5526" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2829" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5245" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3433" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2980" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="141" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1902" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3714" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3735" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2959" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3584" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="703" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3563" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2808" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="3261" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1772" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1751" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2678" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2657" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="1621" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="531" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="6212" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5828" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="6000" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4167" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2074" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4922" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4620" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5849" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4641" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5073" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4490" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4771" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4469" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4943" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2204" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="552" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4188" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4318" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="401" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4792" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="4339" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="5979" to-port="1" /> <edge from-layer="140" from-port="4" to-layer="2053" to-port="1" /> <edge from-layer="141" from-port="2" to-layer="143" to-port="0" /> <edge from-layer="142" from-port="0" to-layer="143" to-port="1" /> <edge from-layer="143" from-port="2" to-layer="248" to-port="1" /> <edge from-layer="144" from-port="1" to-layer="146" to-port="0" /> <edge from-layer="145" from-port="0" to-layer="146" to-port="2" /> <edge from-layer="146" from-port="3" to-layer="160" to-port="0" /> <edge from-layer="147" from-port="0" to-layer="148" to-port="0" /> <edge from-layer="148" from-port="1" to-layer="151" to-port="0" /> <edge from-layer="149" from-port="0" to-layer="150" to-port="0" /> <edge from-layer="150" from-port="1" to-layer="151" to-port="1" /> <edge from-layer="151" from-port="2" to-layer="153" to-port="0" /> <edge from-layer="152" from-port="0" to-layer="153" to-port="1" /> <edge from-layer="153" from-port="2" to-layer="154" to-port="0" /> <edge from-layer="154" from-port="1" to-layer="155" to-port="1" /> <edge from-layer="155" from-port="2" to-layer="157" to-port="0" /> <edge from-layer="156" from-port="0" to-layer="157" to-port="1" /> <edge from-layer="157" from-port="2" to-layer="159" to-port="0" /> <edge from-layer="158" from-port="0" to-layer="159" to-port="1" /> <edge from-layer="159" from-port="2" to-layer="160" to-port="1" /> <edge from-layer="160" from-port="2" to-layer="6181" to-port="0" /> <edge from-layer="160" from-port="2" to-layer="161" to-port="0" /> <edge from-layer="161" from-port="2" to-layer="162" to-port="0" /> <edge from-layer="162" from-port="2" to-layer="164" to-port="0" /> <edge from-layer="163" from-port="0" to-layer="164" to-port="1" /> <edge from-layer="164" from-port="2" to-layer="248" to-port="2" /> <edge from-layer="165" from-port="0" to-layer="182" to-port="0" /> <edge from-layer="165" from-port="0" to-layer="183" to-port="1" /> <edge from-layer="166" from-port="0" to-layer="176" to-port="0" /> <edge from-layer="167" from-port="0" to-layer="175" to-port="0" /> <edge from-layer="168" from-port="1" to-layer="171" to-port="0" /> <edge from-layer="169" from-port="0" to-layer="171" to-port="1" /> <edge from-layer="170" from-port="0" to-layer="171" to-port="2" /> <edge from-layer="171" from-port="3" to-layer="173" to-port="0" /> <edge from-layer="171" from-port="3" to-layer="196" to-port="1" /> <edge from-layer="172" from-port="0" to-layer="173" to-port="1" /> <edge from-layer="173" from-port="2" to-layer="230" to-port="2" /> <edge from-layer="173" from-port="2" to-layer="225" to-port="2" /> <edge from-layer="173" from-port="2" to-layer="174" to-port="1" /> <edge from-layer="174" from-port="2" to-layer="175" to-port="1" /> <edge from-layer="175" from-port="2" to-layer="176" to-port="1" /> <edge from-layer="176" from-port="2" to-layer="193" to-port="1" /> <edge from-layer="176" from-port="2" to-layer="177" to-port="0" /> <edge from-layer="177" from-port="1" to-layer="187" to-port="0" /> <edge from-layer="177" from-port="1" to-layer="180" to-port="0" /> <edge from-layer="178" from-port="0" to-layer="180" to-port="1" /> <edge from-layer="179" from-port="0" to-layer="180" to-port="2" /> <edge from-layer="180" from-port="3" to-layer="182" to-port="1" /> <edge from-layer="181" from-port="0" to-layer="182" to-port="2" /> <edge from-layer="181" from-port="0" to-layer="189" to-port="2" /> <edge from-layer="181" from-port="0" to-layer="190" to-port="1" /> <edge from-layer="182" from-port="3" to-layer="183" to-port="0" /> <edge from-layer="183" from-port="2" to-layer="191" to-port="0" /> <edge from-layer="184" from-port="0" to-layer="189" to-port="0" /> <edge from-layer="184" from-port="0" to-layer="188" to-port="1" /> <edge from-layer="185" from-port="0" to-layer="187" to-port="1" /> <edge from-layer="186" from-port="0" to-layer="187" to-port="2" /> <edge from-layer="187" from-port="3" to-layer="188" to-port="0" /> <edge from-layer="188" from-port="2" to-layer="189" to-port="1" /> <edge from-layer="189" from-port="3" to-layer="190" to-port="0" /> <edge from-layer="190" from-port="2" to-layer="191" to-port="1" /> <edge from-layer="191" from-port="2" to-layer="193" to-port="0" /> <edge from-layer="192" from-port="0" to-layer="193" to-port="2" /> <edge from-layer="193" from-port="3" to-layer="206" to-port="0" /> <edge from-layer="194" from-port="0" to-layer="196" to-port="0" /> <edge from-layer="195" from-port="0" to-layer="196" to-port="2" /> <edge from-layer="196" from-port="3" to-layer="197" to-port="0" /> <edge from-layer="197" from-port="1" to-layer="198" to-port="0" /> <edge from-layer="198" from-port="1" to-layer="204" to-port="0" /> <edge from-layer="199" from-port="2" to-layer="201" to-port="1" /> <edge from-layer="200" from-port="0" to-layer="201" to-port="2" /> <edge from-layer="201" from-port="3" to-layer="203" to-port="0" /> <edge from-layer="202" from-port="0" to-layer="203" to-port="1" /> <edge from-layer="203" from-port="2" to-layer="204" to-port="1" /> <edge from-layer="204" from-port="2" to-layer="205" to-port="0" /> <edge from-layer="205" from-port="1" to-layer="206" to-port="1" /> <edge from-layer="206" from-port="2" to-layer="208" to-port="0" /> <edge from-layer="207" from-port="0" to-layer="208" to-port="1" /> <edge from-layer="208" from-port="2" to-layer="209" to-port="0" /> <edge from-layer="209" from-port="2" to-layer="214" to-port="0" /> <edge from-layer="210" from-port="0" to-layer="213" to-port="1" /> <edge from-layer="211" from-port="0" to-layer="213" to-port="2" /> <edge from-layer="212" from-port="0" to-layer="213" to-port="3" /> <edge from-layer="213" from-port="4" to-layer="214" to-port="1" /> <edge from-layer="214" from-port="2" to-layer="230" to-port="0" /> <edge from-layer="214" from-port="2" to-layer="218" to-port="0" /> <edge from-layer="214" from-port="2" to-layer="216" to-port="0" /> <edge from-layer="215" from-port="0" to-layer="216" to-port="1" /> <edge from-layer="216" from-port="2" to-layer="243" to-port="0" /> <edge from-layer="217" from-port="0" to-layer="219" to-port="1" /> <edge from-layer="217" from-port="0" to-layer="221" to-port="0" /> <edge from-layer="218" from-port="1" to-layer="244" to-port="1" /> <edge from-layer="218" from-port="1" to-layer="222" to-port="1" /> <edge from-layer="218" from-port="1" to-layer="219" to-port="0" /> <edge from-layer="219" from-port="2" to-layer="221" to-port="1" /> <edge from-layer="220" from-port="0" to-layer="221" to-port="2" /> <edge from-layer="221" from-port="3" to-layer="222" to-port="0" /> <edge from-layer="222" from-port="2" to-layer="225" to-port="0" /> <edge from-layer="223" from-port="0" to-layer="225" to-port="1" /> <edge from-layer="224" from-port="0" to-layer="225" to-port="3" /> <edge from-layer="225" from-port="5" to-layer="227" to-port="0" /> <edge from-layer="226" from-port="0" to-layer="227" to-port="1" /> <edge from-layer="227" from-port="2" to-layer="243" to-port="1" /> <edge from-layer="228" from-port="0" to-layer="230" to-port="1" /> <edge from-layer="229" from-port="0" to-layer="230" to-port="3" /> <edge from-layer="230" from-port="5" to-layer="234" to-port="0" /> <edge from-layer="230" from-port="5" to-layer="238" to-port="2" /> <edge from-layer="230" from-port="5" to-layer="239" to-port="0" /> <edge from-layer="231" from-port="2" to-layer="232" to-port="0" /> <edge from-layer="232" from-port="2" to-layer="233" to-port="0" /> <edge from-layer="233" from-port="1" to-layer="234" to-port="1" /> <edge from-layer="234" from-port="2" to-layer="236" to-port="0" /> <edge from-layer="235" from-port="0" to-layer="236" to-port="1" /> <edge from-layer="236" from-port="2" to-layer="238" to-port="0" /> <edge from-layer="237" from-port="0" to-layer="238" to-port="1" /> <edge from-layer="238" from-port="3" to-layer="240" to-port="0" /> <edge from-layer="239" from-port="1" to-layer="240" to-port="1" /> <edge from-layer="240" from-port="2" to-layer="242" to-port="0" /> <edge from-layer="241" from-port="0" to-layer="242" to-port="1" /> <edge from-layer="242" from-port="2" to-layer="243" to-port="2" /> <edge from-layer="243" from-port="3" to-layer="244" to-port="0" /> <edge from-layer="244" from-port="2" to-layer="247" to-port="0" /> <edge from-layer="245" from-port="0" to-layer="247" to-port="1" /> <edge from-layer="246" from-port="0" to-layer="247" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="4795" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="1775" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="2379" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="248" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="5399" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="1310" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="857" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="1159" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="2530" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="5852" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="4644" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="1461" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="5550" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="1008" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="2983" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="5097" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="4493" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="3587" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="4040" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="3134" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="3436" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="3738" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="5701" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="2832" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="2228" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="5248" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="706" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="4946" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="3889" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="1926" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="4342" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="6003" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="2077" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="1624" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="6219" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="555" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="3285" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="404" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="2681" to-port="3" /> <edge from-layer="247" from-port="5" to-layer="4191" to-port="3" /> <edge from-layer="248" from-port="4" to-layer="250" to-port="0" /> <edge from-layer="249" from-port="0" to-layer="250" to-port="1" /> <edge from-layer="250" from-port="2" to-layer="256" to-port="0" /> <edge from-layer="251" from-port="0" to-layer="253" to-port="1" /> <edge from-layer="252" from-port="0" to-layer="253" to-port="2" /> <edge from-layer="253" from-port="3" to-layer="255" to-port="0" /> <edge from-layer="254" from-port="0" to-layer="255" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="1929" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="3288" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="3892" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="860" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="2231" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="4798" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="5704" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="256" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="2080" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="1011" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="4194" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="5855" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="2533" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="4043" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="5100" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="6222" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="3137" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="1162" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="1627" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="1464" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="407" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="558" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="1778" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="2684" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="4496" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="5402" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="1313" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="3590" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="2835" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="4647" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="6006" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="3439" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="5553" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="2986" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="2382" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="4949" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="709" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="5251" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="4345" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="3741" to-port="1" /> <edge from-layer="256" from-port="2" to-layer="265" to-port="0" /> <edge from-layer="257" from-port="0" to-layer="258" to-port="0" /> <edge from-layer="258" from-port="1" to-layer="261" to-port="0" /> <edge from-layer="259" from-port="0" to-layer="260" to-port="0" /> <edge from-layer="260" from-port="1" to-layer="261" to-port="1" /> <edge from-layer="261" from-port="2" to-layer="263" to-port="0" /> <edge from-layer="262" from-port="0" to-layer="263" to-port="1" /> <edge from-layer="263" from-port="2" to-layer="264" to-port="0" /> <edge from-layer="264" from-port="1" to-layer="265" to-port="1" /> <edge from-layer="265" from-port="2" to-layer="266" to-port="1" /> <edge from-layer="266" from-port="2" to-layer="277" to-port="0" /> <edge from-layer="266" from-port="2" to-layer="270" to-port="0" /> <edge from-layer="266" from-port="2" to-layer="308" to-port="0" /> <edge from-layer="267" from-port="0" to-layer="278" to-port="0" /> <edge from-layer="268" from-port="0" to-layer="276" to-port="0" /> <edge from-layer="269" from-port="0" to-layer="270" to-port="1" /> <edge from-layer="270" from-port="2" to-layer="272" to-port="0" /> <edge from-layer="271" from-port="0" to-layer="272" to-port="1" /> <edge from-layer="272" from-port="2" to-layer="274" to-port="0" /> <edge from-layer="273" from-port="0" to-layer="274" to-port="1" /> <edge from-layer="274" from-port="2" to-layer="275" to-port="0" /> <edge from-layer="275" from-port="1" to-layer="276" to-port="1" /> <edge from-layer="276" from-port="2" to-layer="277" to-port="1" /> <edge from-layer="277" from-port="2" to-layer="278" to-port="1" /> <edge from-layer="278" from-port="2" to-layer="287" to-port="0" /> <edge from-layer="278" from-port="2" to-layer="297" to-port="0" /> <edge from-layer="279" from-port="0" to-layer="280" to-port="0" /> <edge from-layer="280" from-port="1" to-layer="283" to-port="0" /> <edge from-layer="281" from-port="0" to-layer="282" to-port="0" /> <edge from-layer="282" from-port="1" to-layer="283" to-port="1" /> <edge from-layer="283" from-port="2" to-layer="285" to-port="0" /> <edge from-layer="284" from-port="0" to-layer="285" to-port="1" /> <edge from-layer="285" from-port="2" to-layer="286" to-port="0" /> <edge from-layer="286" from-port="1" to-layer="287" to-port="1" /> <edge from-layer="287" from-port="2" to-layer="288" to-port="0" /> <edge from-layer="288" from-port="1" to-layer="298" to-port="0" /> <edge from-layer="289" from-port="0" to-layer="290" to-port="0" /> <edge from-layer="290" from-port="1" to-layer="293" to-port="0" /> <edge from-layer="291" from-port="0" to-layer="292" to-port="0" /> <edge from-layer="292" from-port="1" to-layer="293" to-port="1" /> <edge from-layer="293" from-port="2" to-layer="295" to-port="0" /> <edge from-layer="294" from-port="0" to-layer="295" to-port="1" /> <edge from-layer="295" from-port="2" to-layer="296" to-port="0" /> <edge from-layer="296" from-port="1" to-layer="297" to-port="1" /> <edge from-layer="297" from-port="2" to-layer="298" to-port="1" /> <edge from-layer="298" from-port="2" to-layer="307" to-port="0" /> <edge from-layer="299" from-port="0" to-layer="300" to-port="0" /> <edge from-layer="300" from-port="1" to-layer="303" to-port="0" /> <edge from-layer="301" from-port="0" to-layer="302" to-port="0" /> <edge from-layer="302" from-port="1" to-layer="303" to-port="1" /> <edge from-layer="303" from-port="2" to-layer="305" to-port="0" /> <edge from-layer="304" from-port="0" to-layer="305" to-port="1" /> <edge from-layer="305" from-port="2" to-layer="306" to-port="0" /> <edge from-layer="306" from-port="1" to-layer="307" to-port="1" /> <edge from-layer="307" from-port="2" to-layer="308" to-port="1" /> <edge from-layer="308" from-port="2" to-layer="319" to-port="0" /> <edge from-layer="308" from-port="2" to-layer="417" to-port="0" /> <edge from-layer="308" from-port="2" to-layer="312" to-port="0" /> <edge from-layer="309" from-port="0" to-layer="320" to-port="0" /> <edge from-layer="310" from-port="0" to-layer="318" to-port="0" /> <edge from-layer="311" from-port="0" to-layer="312" to-port="1" /> <edge from-layer="312" from-port="2" to-layer="314" to-port="0" /> <edge from-layer="313" from-port="0" to-layer="314" to-port="1" /> <edge from-layer="314" from-port="2" to-layer="316" to-port="0" /> <edge from-layer="315" from-port="0" to-layer="316" to-port="1" /> <edge from-layer="316" from-port="2" to-layer="317" to-port="0" /> <edge from-layer="317" from-port="1" to-layer="318" to-port="1" /> <edge from-layer="318" from-port="2" to-layer="319" to-port="1" /> <edge from-layer="319" from-port="2" to-layer="320" to-port="1" /> <edge from-layer="320" from-port="2" to-layer="329" to-port="0" /> <edge from-layer="320" from-port="2" to-layer="359" to-port="0" /> <edge from-layer="320" from-port="2" to-layer="394" to-port="0" /> <edge from-layer="321" from-port="0" to-layer="322" to-port="0" /> <edge from-layer="322" from-port="1" to-layer="325" to-port="0" /> <edge from-layer="323" from-port="0" to-layer="324" to-port="0" /> <edge from-layer="324" from-port="1" to-layer="325" to-port="1" /> <edge from-layer="325" from-port="2" to-layer="327" to-port="0" /> <edge from-layer="326" from-port="0" to-layer="327" to-port="1" /> <edge from-layer="327" from-port="2" to-layer="328" to-port="0" /> <edge from-layer="328" from-port="1" to-layer="329" to-port="1" /> <edge from-layer="329" from-port="2" to-layer="331" to-port="0" /> <edge from-layer="330" from-port="0" to-layer="331" to-port="1" /> <edge from-layer="331" from-port="2" to-layer="333" to-port="0" /> <edge from-layer="332" from-port="0" to-layer="333" to-port="1" /> <edge from-layer="333" from-port="2" to-layer="334" to-port="0" /> <edge from-layer="333" from-port="2" to-layer="338" to-port="0" /> <edge from-layer="333" from-port="2" to-layer="344" to-port="0" /> <edge from-layer="334" from-port="2" to-layer="347" to-port="0" /> <edge from-layer="335" from-port="0" to-layer="338" to-port="1" /> <edge from-layer="336" from-port="0" to-layer="338" to-port="2" /> <edge from-layer="337" from-port="0" to-layer="338" to-port="3" /> <edge from-layer="338" from-port="5" to-layer="340" to-port="0" /> <edge from-layer="339" from-port="0" to-layer="340" to-port="1" /> <edge from-layer="340" from-port="2" to-layer="345" to-port="0" /> <edge from-layer="341" from-port="0" to-layer="344" to-port="1" /> <edge from-layer="342" from-port="0" to-layer="344" to-port="2" /> <edge from-layer="343" from-port="0" to-layer="344" to-port="3" /> <edge from-layer="344" from-port="5" to-layer="345" to-port="1" /> <edge from-layer="345" from-port="2" to-layer="346" to-port="0" /> <edge from-layer="346" from-port="2" to-layer="347" to-port="1" /> <edge from-layer="347" from-port="2" to-layer="404" to-port="0" /> <edge from-layer="348" from-port="1" to-layer="350" to-port="0" /> <edge from-layer="349" from-port="0" to-layer="350" to-port="2" /> <edge from-layer="350" from-port="3" to-layer="378" to-port="0" /> <edge from-layer="351" from-port="0" to-layer="352" to-port="0" /> <edge from-layer="352" from-port="1" to-layer="355" to-port="0" /> <edge from-layer="353" from-port="0" to-layer="354" to-port="0" /> <edge from-layer="354" from-port="1" to-layer="355" to-port="1" /> <edge from-layer="355" from-port="2" to-layer="357" to-port="0" /> <edge from-layer="356" from-port="0" to-layer="357" to-port="1" /> <edge from-layer="357" from-port="2" to-layer="358" to-port="0" /> <edge from-layer="358" from-port="1" to-layer="359" to-port="1" /> <edge from-layer="359" from-port="2" to-layer="361" to-port="0" /> <edge from-layer="360" from-port="0" to-layer="361" to-port="1" /> <edge from-layer="361" from-port="2" to-layer="363" to-port="0" /> <edge from-layer="362" from-port="0" to-layer="363" to-port="1" /> <edge from-layer="363" from-port="2" to-layer="364" to-port="0" /> <edge from-layer="363" from-port="2" to-layer="368" to-port="0" /> <edge from-layer="363" from-port="2" to-layer="374" to-port="0" /> <edge from-layer="364" from-port="2" to-layer="377" to-port="0" /> <edge from-layer="365" from-port="0" to-layer="368" to-port="1" /> <edge from-layer="366" from-port="0" to-layer="368" to-port="2" /> <edge from-layer="367" from-port="0" to-layer="368" to-port="3" /> <edge from-layer="368" from-port="5" to-layer="370" to-port="0" /> <edge from-layer="369" from-port="0" to-layer="370" to-port="1" /> <edge from-layer="370" from-port="2" to-layer="375" to-port="0" /> <edge from-layer="371" from-port="0" to-layer="374" to-port="1" /> <edge from-layer="372" from-port="0" to-layer="374" to-port="2" /> <edge from-layer="373" from-port="0" to-layer="374" to-port="3" /> <edge from-layer="374" from-port="5" to-layer="375" to-port="1" /> <edge from-layer="375" from-port="2" to-layer="376" to-port="0" /> <edge from-layer="376" from-port="2" to-layer="377" to-port="1" /> <edge from-layer="377" from-port="2" to-layer="378" to-port="1" /> <edge from-layer="378" from-port="2" to-layer="6180" to-port="0" /> <edge from-layer="378" from-port="2" to-layer="379" to-port="0" /> <edge from-layer="379" from-port="2" to-layer="380" to-port="0" /> <edge from-layer="380" from-port="2" to-layer="382" to-port="0" /> <edge from-layer="381" from-port="0" to-layer="382" to-port="1" /> <edge from-layer="382" from-port="2" to-layer="404" to-port="1" /> <edge from-layer="383" from-port="1" to-layer="385" to-port="0" /> <edge from-layer="384" from-port="0" to-layer="385" to-port="2" /> <edge from-layer="385" from-port="3" to-layer="399" to-port="0" /> <edge from-layer="386" from-port="0" to-layer="387" to-port="0" /> <edge from-layer="387" from-port="1" to-layer="390" to-port="0" /> <edge from-layer="388" from-port="0" to-layer="389" to-port="0" /> <edge from-layer="389" from-port="1" to-layer="390" to-port="1" /> <edge from-layer="390" from-port="2" to-layer="392" to-port="0" /> <edge from-layer="391" from-port="0" to-layer="392" to-port="1" /> <edge from-layer="392" from-port="2" to-layer="393" to-port="0" /> <edge from-layer="393" from-port="1" to-layer="394" to-port="1" /> <edge from-layer="394" from-port="2" to-layer="396" to-port="0" /> <edge from-layer="395" from-port="0" to-layer="396" to-port="1" /> <edge from-layer="396" from-port="2" to-layer="398" to-port="0" /> <edge from-layer="397" from-port="0" to-layer="398" to-port="1" /> <edge from-layer="398" from-port="2" to-layer="399" to-port="1" /> <edge from-layer="399" from-port="2" to-layer="6179" to-port="0" /> <edge from-layer="399" from-port="2" to-layer="400" to-port="0" /> <edge from-layer="400" from-port="2" to-layer="401" to-port="0" /> <edge from-layer="401" from-port="2" to-layer="403" to-port="0" /> <edge from-layer="402" from-port="0" to-layer="403" to-port="1" /> <edge from-layer="403" from-port="2" to-layer="404" to-port="2" /> <edge from-layer="404" from-port="4" to-layer="406" to-port="0" /> <edge from-layer="405" from-port="0" to-layer="406" to-port="1" /> <edge from-layer="406" from-port="2" to-layer="407" to-port="0" /> <edge from-layer="407" from-port="2" to-layer="416" to-port="0" /> <edge from-layer="408" from-port="0" to-layer="409" to-port="0" /> <edge from-layer="409" from-port="1" to-layer="412" to-port="0" /> <edge from-layer="410" from-port="0" to-layer="411" to-port="0" /> <edge from-layer="411" from-port="1" to-layer="412" to-port="1" /> <edge from-layer="412" from-port="2" to-layer="414" to-port="0" /> <edge from-layer="413" from-port="0" to-layer="414" to-port="1" /> <edge from-layer="414" from-port="2" to-layer="415" to-port="0" /> <edge from-layer="415" from-port="1" to-layer="416" to-port="1" /> <edge from-layer="416" from-port="2" to-layer="417" to-port="1" /> <edge from-layer="417" from-port="2" to-layer="428" to-port="0" /> <edge from-layer="417" from-port="2" to-layer="421" to-port="0" /> <edge from-layer="417" from-port="2" to-layer="459" to-port="0" /> <edge from-layer="418" from-port="0" to-layer="429" to-port="0" /> <edge from-layer="419" from-port="0" to-layer="427" to-port="0" /> <edge from-layer="420" from-port="0" to-layer="421" to-port="1" /> <edge from-layer="421" from-port="2" to-layer="423" to-port="0" /> <edge from-layer="422" from-port="0" to-layer="423" to-port="1" /> <edge from-layer="423" from-port="2" to-layer="425" to-port="0" /> <edge from-layer="424" from-port="0" to-layer="425" to-port="1" /> <edge from-layer="425" from-port="2" to-layer="426" to-port="0" /> <edge from-layer="426" from-port="1" to-layer="427" to-port="1" /> <edge from-layer="427" from-port="2" to-layer="428" to-port="1" /> <edge from-layer="428" from-port="2" to-layer="429" to-port="1" /> <edge from-layer="429" from-port="2" to-layer="438" to-port="0" /> <edge from-layer="429" from-port="2" to-layer="448" to-port="0" /> <edge from-layer="430" from-port="0" to-layer="431" to-port="0" /> <edge from-layer="431" from-port="1" to-layer="434" to-port="0" /> <edge from-layer="432" from-port="0" to-layer="433" to-port="0" /> <edge from-layer="433" from-port="1" to-layer="434" to-port="1" /> <edge from-layer="434" from-port="2" to-layer="436" to-port="0" /> <edge from-layer="435" from-port="0" to-layer="436" to-port="1" /> <edge from-layer="436" from-port="2" to-layer="437" to-port="0" /> <edge from-layer="437" from-port="1" to-layer="438" to-port="1" /> <edge from-layer="438" from-port="2" to-layer="439" to-port="0" /> <edge from-layer="439" from-port="1" to-layer="449" to-port="0" /> <edge from-layer="440" from-port="0" to-layer="441" to-port="0" /> <edge from-layer="441" from-port="1" to-layer="444" to-port="0" /> <edge from-layer="442" from-port="0" to-layer="443" to-port="0" /> <edge from-layer="443" from-port="1" to-layer="444" to-port="1" /> <edge from-layer="444" from-port="2" to-layer="446" to-port="0" /> <edge from-layer="445" from-port="0" to-layer="446" to-port="1" /> <edge from-layer="446" from-port="2" to-layer="447" to-port="0" /> <edge from-layer="447" from-port="1" to-layer="448" to-port="1" /> <edge from-layer="448" from-port="2" to-layer="449" to-port="1" /> <edge from-layer="449" from-port="2" to-layer="458" to-port="0" /> <edge from-layer="450" from-port="0" to-layer="451" to-port="0" /> <edge from-layer="451" from-port="1" to-layer="454" to-port="0" /> <edge from-layer="452" from-port="0" to-layer="453" to-port="0" /> <edge from-layer="453" from-port="1" to-layer="454" to-port="1" /> <edge from-layer="454" from-port="2" to-layer="456" to-port="0" /> <edge from-layer="455" from-port="0" to-layer="456" to-port="1" /> <edge from-layer="456" from-port="2" to-layer="457" to-port="0" /> <edge from-layer="457" from-port="1" to-layer="458" to-port="1" /> <edge from-layer="458" from-port="2" to-layer="459" to-port="1" /> <edge from-layer="459" from-port="2" to-layer="463" to-port="0" /> <edge from-layer="459" from-port="2" to-layer="470" to-port="0" /> <edge from-layer="459" from-port="2" to-layer="568" to-port="0" /> <edge from-layer="460" from-port="0" to-layer="471" to-port="0" /> <edge from-layer="461" from-port="0" to-layer="469" to-port="0" /> <edge from-layer="462" from-port="0" to-layer="463" to-port="1" /> <edge from-layer="463" from-port="2" to-layer="465" to-port="0" /> <edge from-layer="464" from-port="0" to-layer="465" to-port="1" /> <edge from-layer="465" from-port="2" to-layer="467" to-port="0" /> <edge from-layer="466" from-port="0" to-layer="467" to-port="1" /> <edge from-layer="467" from-port="2" to-layer="468" to-port="0" /> <edge from-layer="468" from-port="1" to-layer="469" to-port="1" /> <edge from-layer="469" from-port="2" to-layer="470" to-port="1" /> <edge from-layer="470" from-port="2" to-layer="471" to-port="1" /> <edge from-layer="471" from-port="2" to-layer="480" to-port="0" /> <edge from-layer="471" from-port="2" to-layer="510" to-port="0" /> <edge from-layer="471" from-port="2" to-layer="545" to-port="0" /> <edge from-layer="472" from-port="0" to-layer="473" to-port="0" /> <edge from-layer="473" from-port="1" to-layer="476" to-port="0" /> <edge from-layer="474" from-port="0" to-layer="475" to-port="0" /> <edge from-layer="475" from-port="1" to-layer="476" to-port="1" /> <edge from-layer="476" from-port="2" to-layer="478" to-port="0" /> <edge from-layer="477" from-port="0" to-layer="478" to-port="1" /> <edge from-layer="478" from-port="2" to-layer="479" to-port="0" /> <edge from-layer="479" from-port="1" to-layer="480" to-port="1" /> <edge from-layer="480" from-port="2" to-layer="482" to-port="0" /> <edge from-layer="481" from-port="0" to-layer="482" to-port="1" /> <edge from-layer="482" from-port="2" to-layer="484" to-port="0" /> <edge from-layer="483" from-port="0" to-layer="484" to-port="1" /> <edge from-layer="484" from-port="2" to-layer="485" to-port="0" /> <edge from-layer="484" from-port="2" to-layer="489" to-port="0" /> <edge from-layer="484" from-port="2" to-layer="495" to-port="0" /> <edge from-layer="485" from-port="2" to-layer="498" to-port="0" /> <edge from-layer="486" from-port="0" to-layer="489" to-port="1" /> <edge from-layer="487" from-port="0" to-layer="489" to-port="2" /> <edge from-layer="488" from-port="0" to-layer="489" to-port="3" /> <edge from-layer="489" from-port="5" to-layer="491" to-port="0" /> <edge from-layer="490" from-port="0" to-layer="491" to-port="1" /> <edge from-layer="491" from-port="2" to-layer="496" to-port="0" /> <edge from-layer="492" from-port="0" to-layer="495" to-port="1" /> <edge from-layer="493" from-port="0" to-layer="495" to-port="2" /> <edge from-layer="494" from-port="0" to-layer="495" to-port="3" /> <edge from-layer="495" from-port="5" to-layer="496" to-port="1" /> <edge from-layer="496" from-port="2" to-layer="497" to-port="0" /> <edge from-layer="497" from-port="2" to-layer="498" to-port="1" /> <edge from-layer="498" from-port="2" to-layer="555" to-port="0" /> <edge from-layer="499" from-port="1" to-layer="501" to-port="0" /> <edge from-layer="500" from-port="0" to-layer="501" to-port="2" /> <edge from-layer="501" from-port="3" to-layer="529" to-port="0" /> <edge from-layer="502" from-port="0" to-layer="503" to-port="0" /> <edge from-layer="503" from-port="1" to-layer="506" to-port="0" /> <edge from-layer="504" from-port="0" to-layer="505" to-port="0" /> <edge from-layer="505" from-port="1" to-layer="506" to-port="1" /> <edge from-layer="506" from-port="2" to-layer="508" to-port="0" /> <edge from-layer="507" from-port="0" to-layer="508" to-port="1" /> <edge from-layer="508" from-port="2" to-layer="509" to-port="0" /> <edge from-layer="509" from-port="1" to-layer="510" to-port="1" /> <edge from-layer="510" from-port="2" to-layer="512" to-port="0" /> <edge from-layer="511" from-port="0" to-layer="512" to-port="1" /> <edge from-layer="512" from-port="2" to-layer="514" to-port="0" /> <edge from-layer="513" from-port="0" to-layer="514" to-port="1" /> <edge from-layer="514" from-port="2" to-layer="515" to-port="0" /> <edge from-layer="514" from-port="2" to-layer="519" to-port="0" /> <edge from-layer="514" from-port="2" to-layer="525" to-port="0" /> <edge from-layer="515" from-port="2" to-layer="528" to-port="0" /> <edge from-layer="516" from-port="0" to-layer="519" to-port="1" /> <edge from-layer="517" from-port="0" to-layer="519" to-port="2" /> <edge from-layer="518" from-port="0" to-layer="519" to-port="3" /> <edge from-layer="519" from-port="5" to-layer="521" to-port="0" /> <edge from-layer="520" from-port="0" to-layer="521" to-port="1" /> <edge from-layer="521" from-port="2" to-layer="526" to-port="0" /> <edge from-layer="522" from-port="0" to-layer="525" to-port="1" /> <edge from-layer="523" from-port="0" to-layer="525" to-port="2" /> <edge from-layer="524" from-port="0" to-layer="525" to-port="3" /> <edge from-layer="525" from-port="5" to-layer="526" to-port="1" /> <edge from-layer="526" from-port="2" to-layer="527" to-port="0" /> <edge from-layer="527" from-port="2" to-layer="528" to-port="1" /> <edge from-layer="528" from-port="2" to-layer="529" to-port="1" /> <edge from-layer="529" from-port="2" to-layer="6158" to-port="0" /> <edge from-layer="529" from-port="2" to-layer="530" to-port="0" /> <edge from-layer="530" from-port="2" to-layer="531" to-port="0" /> <edge from-layer="531" from-port="2" to-layer="533" to-port="0" /> <edge from-layer="532" from-port="0" to-layer="533" to-port="1" /> <edge from-layer="533" from-port="2" to-layer="555" to-port="1" /> <edge from-layer="534" from-port="1" to-layer="536" to-port="0" /> <edge from-layer="535" from-port="0" to-layer="536" to-port="2" /> <edge from-layer="536" from-port="3" to-layer="550" to-port="0" /> <edge from-layer="537" from-port="0" to-layer="538" to-port="0" /> <edge from-layer="538" from-port="1" to-layer="541" to-port="0" /> <edge from-layer="539" from-port="0" to-layer="540" to-port="0" /> <edge from-layer="540" from-port="1" to-layer="541" to-port="1" /> <edge from-layer="541" from-port="2" to-layer="543" to-port="0" /> <edge from-layer="542" from-port="0" to-layer="543" to-port="1" /> <edge from-layer="543" from-port="2" to-layer="544" to-port="0" /> <edge from-layer="544" from-port="1" to-layer="545" to-port="1" /> <edge from-layer="545" from-port="2" to-layer="547" to-port="0" /> <edge from-layer="546" from-port="0" to-layer="547" to-port="1" /> <edge from-layer="547" from-port="2" to-layer="549" to-port="0" /> <edge from-layer="548" from-port="0" to-layer="549" to-port="1" /> <edge from-layer="549" from-port="2" to-layer="550" to-port="1" /> <edge from-layer="550" from-port="2" to-layer="6157" to-port="0" /> <edge from-layer="550" from-port="2" to-layer="551" to-port="0" /> <edge from-layer="551" from-port="2" to-layer="552" to-port="0" /> <edge from-layer="552" from-port="2" to-layer="554" to-port="0" /> <edge from-layer="553" from-port="0" to-layer="554" to-port="1" /> <edge from-layer="554" from-port="2" to-layer="555" to-port="2" /> <edge from-layer="555" from-port="4" to-layer="557" to-port="0" /> <edge from-layer="556" from-port="0" to-layer="557" to-port="1" /> <edge from-layer="557" from-port="2" to-layer="558" to-port="0" /> <edge from-layer="558" from-port="2" to-layer="567" to-port="0" /> <edge from-layer="559" from-port="0" to-layer="560" to-port="0" /> <edge from-layer="560" from-port="1" to-layer="563" to-port="0" /> <edge from-layer="561" from-port="0" to-layer="562" to-port="0" /> <edge from-layer="562" from-port="1" to-layer="563" to-port="1" /> <edge from-layer="563" from-port="2" to-layer="565" to-port="0" /> <edge from-layer="564" from-port="0" to-layer="565" to-port="1" /> <edge from-layer="565" from-port="2" to-layer="566" to-port="0" /> <edge from-layer="566" from-port="1" to-layer="567" to-port="1" /> <edge from-layer="567" from-port="2" to-layer="568" to-port="1" /> <edge from-layer="568" from-port="2" to-layer="572" to-port="0" /> <edge from-layer="568" from-port="2" to-layer="610" to-port="0" /> <edge from-layer="568" from-port="2" to-layer="579" to-port="0" /> <edge from-layer="569" from-port="0" to-layer="580" to-port="0" /> <edge from-layer="570" from-port="0" to-layer="578" to-port="0" /> <edge from-layer="571" from-port="0" to-layer="572" to-port="1" /> <edge from-layer="572" from-port="2" to-layer="574" to-port="0" /> <edge from-layer="573" from-port="0" to-layer="574" to-port="1" /> <edge from-layer="574" from-port="2" to-layer="576" to-port="0" /> <edge from-layer="575" from-port="0" to-layer="576" to-port="1" /> <edge from-layer="576" from-port="2" to-layer="577" to-port="0" /> <edge from-layer="577" from-port="1" to-layer="578" to-port="1" /> <edge from-layer="578" from-port="2" to-layer="579" to-port="1" /> <edge from-layer="579" from-port="2" to-layer="580" to-port="1" /> <edge from-layer="580" from-port="2" to-layer="599" to-port="0" /> <edge from-layer="580" from-port="2" to-layer="589" to-port="0" /> <edge from-layer="581" from-port="0" to-layer="582" to-port="0" /> <edge from-layer="582" from-port="1" to-layer="585" to-port="0" /> <edge from-layer="583" from-port="0" to-layer="584" to-port="0" /> <edge from-layer="584" from-port="1" to-layer="585" to-port="1" /> <edge from-layer="585" from-port="2" to-layer="587" to-port="0" /> <edge from-layer="586" from-port="0" to-layer="587" to-port="1" /> <edge from-layer="587" from-port="2" to-layer="588" to-port="0" /> <edge from-layer="588" from-port="1" to-layer="589" to-port="1" /> <edge from-layer="589" from-port="2" to-layer="590" to-port="0" /> <edge from-layer="590" from-port="1" to-layer="600" to-port="0" /> <edge from-layer="591" from-port="0" to-layer="592" to-port="0" /> <edge from-layer="592" from-port="1" to-layer="595" to-port="0" /> <edge from-layer="593" from-port="0" to-layer="594" to-port="0" /> <edge from-layer="594" from-port="1" to-layer="595" to-port="1" /> <edge from-layer="595" from-port="2" to-layer="597" to-port="0" /> <edge from-layer="596" from-port="0" to-layer="597" to-port="1" /> <edge from-layer="597" from-port="2" to-layer="598" to-port="0" /> <edge from-layer="598" from-port="1" to-layer="599" to-port="1" /> <edge from-layer="599" from-port="2" to-layer="600" to-port="1" /> <edge from-layer="600" from-port="2" to-layer="609" to-port="0" /> <edge from-layer="601" from-port="0" to-layer="602" to-port="0" /> <edge from-layer="602" from-port="1" to-layer="605" to-port="0" /> <edge from-layer="603" from-port="0" to-layer="604" to-port="0" /> <edge from-layer="604" from-port="1" to-layer="605" to-port="1" /> <edge from-layer="605" from-port="2" to-layer="607" to-port="0" /> <edge from-layer="606" from-port="0" to-layer="607" to-port="1" /> <edge from-layer="607" from-port="2" to-layer="608" to-port="0" /> <edge from-layer="608" from-port="1" to-layer="609" to-port="1" /> <edge from-layer="609" from-port="2" to-layer="610" to-port="1" /> <edge from-layer="610" from-port="2" to-layer="621" to-port="0" /> <edge from-layer="610" from-port="2" to-layer="614" to-port="0" /> <edge from-layer="610" from-port="2" to-layer="719" to-port="0" /> <edge from-layer="611" from-port="0" to-layer="622" to-port="0" /> <edge from-layer="612" from-port="0" to-layer="620" to-port="0" /> <edge from-layer="613" from-port="0" to-layer="614" to-port="1" /> <edge from-layer="614" from-port="2" to-layer="616" to-port="0" /> <edge from-layer="615" from-port="0" to-layer="616" to-port="1" /> <edge from-layer="616" from-port="2" to-layer="618" to-port="0" /> <edge from-layer="617" from-port="0" to-layer="618" to-port="1" /> <edge from-layer="618" from-port="2" to-layer="619" to-port="0" /> <edge from-layer="619" from-port="1" to-layer="620" to-port="1" /> <edge from-layer="620" from-port="2" to-layer="621" to-port="1" /> <edge from-layer="621" from-port="2" to-layer="622" to-port="1" /> <edge from-layer="622" from-port="2" to-layer="631" to-port="0" /> <edge from-layer="622" from-port="2" to-layer="661" to-port="0" /> <edge from-layer="622" from-port="2" to-layer="696" to-port="0" /> <edge from-layer="623" from-port="0" to-layer="624" to-port="0" /> <edge from-layer="624" from-port="1" to-layer="627" to-port="0" /> <edge from-layer="625" from-port="0" to-layer="626" to-port="0" /> <edge from-layer="626" from-port="1" to-layer="627" to-port="1" /> <edge from-layer="627" from-port="2" to-layer="629" to-port="0" /> <edge from-layer="628" from-port="0" to-layer="629" to-port="1" /> <edge from-layer="629" from-port="2" to-layer="630" to-port="0" /> <edge from-layer="630" from-port="1" to-layer="631" to-port="1" /> <edge from-layer="631" from-port="2" to-layer="633" to-port="0" /> <edge from-layer="632" from-port="0" to-layer="633" to-port="1" /> <edge from-layer="633" from-port="2" to-layer="635" to-port="0" /> <edge from-layer="634" from-port="0" to-layer="635" to-port="1" /> <edge from-layer="635" from-port="2" to-layer="646" to-port="0" /> <edge from-layer="635" from-port="2" to-layer="636" to-port="0" /> <edge from-layer="635" from-port="2" to-layer="640" to-port="0" /> <edge from-layer="636" from-port="2" to-layer="649" to-port="0" /> <edge from-layer="637" from-port="0" to-layer="640" to-port="1" /> <edge from-layer="638" from-port="0" to-layer="640" to-port="2" /> <edge from-layer="639" from-port="0" to-layer="640" to-port="3" /> <edge from-layer="640" from-port="5" to-layer="642" to-port="0" /> <edge from-layer="641" from-port="0" to-layer="642" to-port="1" /> <edge from-layer="642" from-port="2" to-layer="647" to-port="0" /> <edge from-layer="643" from-port="0" to-layer="646" to-port="1" /> <edge from-layer="644" from-port="0" to-layer="646" to-port="2" /> <edge from-layer="645" from-port="0" to-layer="646" to-port="3" /> <edge from-layer="646" from-port="5" to-layer="647" to-port="1" /> <edge from-layer="647" from-port="2" to-layer="648" to-port="0" /> <edge from-layer="648" from-port="2" to-layer="649" to-port="1" /> <edge from-layer="649" from-port="2" to-layer="706" to-port="0" /> <edge from-layer="650" from-port="1" to-layer="652" to-port="0" /> <edge from-layer="651" from-port="0" to-layer="652" to-port="2" /> <edge from-layer="652" from-port="3" to-layer="680" to-port="0" /> <edge from-layer="653" from-port="0" to-layer="654" to-port="0" /> <edge from-layer="654" from-port="1" to-layer="657" to-port="0" /> <edge from-layer="655" from-port="0" to-layer="656" to-port="0" /> <edge from-layer="656" from-port="1" to-layer="657" to-port="1" /> <edge from-layer="657" from-port="2" to-layer="659" to-port="0" /> <edge from-layer="658" from-port="0" to-layer="659" to-port="1" /> <edge from-layer="659" from-port="2" to-layer="660" to-port="0" /> <edge from-layer="660" from-port="1" to-layer="661" to-port="1" /> <edge from-layer="661" from-port="2" to-layer="663" to-port="0" /> <edge from-layer="662" from-port="0" to-layer="663" to-port="1" /> <edge from-layer="663" from-port="2" to-layer="665" to-port="0" /> <edge from-layer="664" from-port="0" to-layer="665" to-port="1" /> <edge from-layer="665" from-port="2" to-layer="676" to-port="0" /> <edge from-layer="665" from-port="2" to-layer="666" to-port="0" /> <edge from-layer="665" from-port="2" to-layer="670" to-port="0" /> <edge from-layer="666" from-port="2" to-layer="679" to-port="0" /> <edge from-layer="667" from-port="0" to-layer="670" to-port="1" /> <edge from-layer="668" from-port="0" to-layer="670" to-port="2" /> <edge from-layer="669" from-port="0" to-layer="670" to-port="3" /> <edge from-layer="670" from-port="5" to-layer="672" to-port="0" /> <edge from-layer="671" from-port="0" to-layer="672" to-port="1" /> <edge from-layer="672" from-port="2" to-layer="677" to-port="0" /> <edge from-layer="673" from-port="0" to-layer="676" to-port="1" /> <edge from-layer="674" from-port="0" to-layer="676" to-port="2" /> <edge from-layer="675" from-port="0" to-layer="676" to-port="3" /> <edge from-layer="676" from-port="5" to-layer="677" to-port="1" /> <edge from-layer="677" from-port="2" to-layer="678" to-port="0" /> <edge from-layer="678" from-port="2" to-layer="679" to-port="1" /> <edge from-layer="679" from-port="2" to-layer="680" to-port="1" /> <edge from-layer="680" from-port="2" to-layer="681" to-port="0" /> <edge from-layer="680" from-port="2" to-layer="6136" to-port="0" /> <edge from-layer="681" from-port="2" to-layer="682" to-port="0" /> <edge from-layer="682" from-port="2" to-layer="684" to-port="0" /> <edge from-layer="683" from-port="0" to-layer="684" to-port="1" /> <edge from-layer="684" from-port="2" to-layer="706" to-port="1" /> <edge from-layer="685" from-port="1" to-layer="687" to-port="0" /> <edge from-layer="686" from-port="0" to-layer="687" to-port="2" /> <edge from-layer="687" from-port="3" to-layer="701" to-port="0" /> <edge from-layer="688" from-port="0" to-layer="689" to-port="0" /> <edge from-layer="689" from-port="1" to-layer="692" to-port="0" /> <edge from-layer="690" from-port="0" to-layer="691" to-port="0" /> <edge from-layer="691" from-port="1" to-layer="692" to-port="1" /> <edge from-layer="692" from-port="2" to-layer="694" to-port="0" /> <edge from-layer="693" from-port="0" to-layer="694" to-port="1" /> <edge from-layer="694" from-port="2" to-layer="695" to-port="0" /> <edge from-layer="695" from-port="1" to-layer="696" to-port="1" /> <edge from-layer="696" from-port="2" to-layer="698" to-port="0" /> <edge from-layer="697" from-port="0" to-layer="698" to-port="1" /> <edge from-layer="698" from-port="2" to-layer="700" to-port="0" /> <edge from-layer="699" from-port="0" to-layer="700" to-port="1" /> <edge from-layer="700" from-port="2" to-layer="701" to-port="1" /> <edge from-layer="701" from-port="2" to-layer="702" to-port="0" /> <edge from-layer="701" from-port="2" to-layer="6135" to-port="0" /> <edge from-layer="702" from-port="2" to-layer="703" to-port="0" /> <edge from-layer="703" from-port="2" to-layer="705" to-port="0" /> <edge from-layer="704" from-port="0" to-layer="705" to-port="1" /> <edge from-layer="705" from-port="2" to-layer="706" to-port="2" /> <edge from-layer="706" from-port="4" to-layer="708" to-port="0" /> <edge from-layer="707" from-port="0" to-layer="708" to-port="1" /> <edge from-layer="708" from-port="2" to-layer="709" to-port="0" /> <edge from-layer="709" from-port="2" to-layer="718" to-port="0" /> <edge from-layer="710" from-port="0" to-layer="711" to-port="0" /> <edge from-layer="711" from-port="1" to-layer="714" to-port="0" /> <edge from-layer="712" from-port="0" to-layer="713" to-port="0" /> <edge from-layer="713" from-port="1" to-layer="714" to-port="1" /> <edge from-layer="714" from-port="2" to-layer="716" to-port="0" /> <edge from-layer="715" from-port="0" to-layer="716" to-port="1" /> <edge from-layer="716" from-port="2" to-layer="717" to-port="0" /> <edge from-layer="717" from-port="1" to-layer="718" to-port="1" /> <edge from-layer="718" from-port="2" to-layer="719" to-port="1" /> <edge from-layer="719" from-port="2" to-layer="761" to-port="0" /> <edge from-layer="719" from-port="2" to-layer="730" to-port="0" /> <edge from-layer="719" from-port="2" to-layer="723" to-port="0" /> <edge from-layer="720" from-port="0" to-layer="731" to-port="0" /> <edge from-layer="721" from-port="0" to-layer="729" to-port="0" /> <edge from-layer="722" from-port="0" to-layer="723" to-port="1" /> <edge from-layer="723" from-port="2" to-layer="725" to-port="0" /> <edge from-layer="724" from-port="0" to-layer="725" to-port="1" /> <edge from-layer="725" from-port="2" to-layer="727" to-port="0" /> <edge from-layer="726" from-port="0" to-layer="727" to-port="1" /> <edge from-layer="727" from-port="2" to-layer="728" to-port="0" /> <edge from-layer="728" from-port="1" to-layer="729" to-port="1" /> <edge from-layer="729" from-port="2" to-layer="730" to-port="1" /> <edge from-layer="730" from-port="2" to-layer="731" to-port="1" /> <edge from-layer="731" from-port="2" to-layer="750" to-port="0" /> <edge from-layer="731" from-port="2" to-layer="740" to-port="0" /> <edge from-layer="732" from-port="0" to-layer="733" to-port="0" /> <edge from-layer="733" from-port="1" to-layer="736" to-port="0" /> <edge from-layer="734" from-port="0" to-layer="735" to-port="0" /> <edge from-layer="735" from-port="1" to-layer="736" to-port="1" /> <edge from-layer="736" from-port="2" to-layer="738" to-port="0" /> <edge from-layer="737" from-port="0" to-layer="738" to-port="1" /> <edge from-layer="738" from-port="2" to-layer="739" to-port="0" /> <edge from-layer="739" from-port="1" to-layer="740" to-port="1" /> <edge from-layer="740" from-port="2" to-layer="741" to-port="0" /> <edge from-layer="741" from-port="1" to-layer="751" to-port="0" /> <edge from-layer="742" from-port="0" to-layer="743" to-port="0" /> <edge from-layer="743" from-port="1" to-layer="746" to-port="0" /> <edge from-layer="744" from-port="0" to-layer="745" to-port="0" /> <edge from-layer="745" from-port="1" to-layer="746" to-port="1" /> <edge from-layer="746" from-port="2" to-layer="748" to-port="0" /> <edge from-layer="747" from-port="0" to-layer="748" to-port="1" /> <edge from-layer="748" from-port="2" to-layer="749" to-port="0" /> <edge from-layer="749" from-port="1" to-layer="750" to-port="1" /> <edge from-layer="750" from-port="2" to-layer="751" to-port="1" /> <edge from-layer="751" from-port="2" to-layer="760" to-port="0" /> <edge from-layer="752" from-port="0" to-layer="753" to-port="0" /> <edge from-layer="753" from-port="1" to-layer="756" to-port="0" /> <edge from-layer="754" from-port="0" to-layer="755" to-port="0" /> <edge from-layer="755" from-port="1" to-layer="756" to-port="1" /> <edge from-layer="756" from-port="2" to-layer="758" to-port="0" /> <edge from-layer="757" from-port="0" to-layer="758" to-port="1" /> <edge from-layer="758" from-port="2" to-layer="759" to-port="0" /> <edge from-layer="759" from-port="1" to-layer="760" to-port="1" /> <edge from-layer="760" from-port="2" to-layer="761" to-port="1" /> <edge from-layer="761" from-port="2" to-layer="870" to-port="0" /> <edge from-layer="761" from-port="2" to-layer="772" to-port="0" /> <edge from-layer="761" from-port="2" to-layer="765" to-port="0" /> <edge from-layer="762" from-port="0" to-layer="773" to-port="0" /> <edge from-layer="763" from-port="0" to-layer="771" to-port="0" /> <edge from-layer="764" from-port="0" to-layer="765" to-port="1" /> <edge from-layer="765" from-port="2" to-layer="767" to-port="0" /> <edge from-layer="766" from-port="0" to-layer="767" to-port="1" /> <edge from-layer="767" from-port="2" to-layer="769" to-port="0" /> <edge from-layer="768" from-port="0" to-layer="769" to-port="1" /> <edge from-layer="769" from-port="2" to-layer="770" to-port="0" /> <edge from-layer="770" from-port="1" to-layer="771" to-port="1" /> <edge from-layer="771" from-port="2" to-layer="772" to-port="1" /> <edge from-layer="772" from-port="2" to-layer="773" to-port="1" /> <edge from-layer="773" from-port="2" to-layer="782" to-port="0" /> <edge from-layer="773" from-port="2" to-layer="847" to-port="0" /> <edge from-layer="773" from-port="2" to-layer="812" to-port="0" /> <edge from-layer="774" from-port="0" to-layer="775" to-port="0" /> <edge from-layer="775" from-port="1" to-layer="778" to-port="0" /> <edge from-layer="776" from-port="0" to-layer="777" to-port="0" /> <edge from-layer="777" from-port="1" to-layer="778" to-port="1" /> <edge from-layer="778" from-port="2" to-layer="780" to-port="0" /> <edge from-layer="779" from-port="0" to-layer="780" to-port="1" /> <edge from-layer="780" from-port="2" to-layer="781" to-port="0" /> <edge from-layer="781" from-port="1" to-layer="782" to-port="1" /> <edge from-layer="782" from-port="2" to-layer="784" to-port="0" /> <edge from-layer="783" from-port="0" to-layer="784" to-port="1" /> <edge from-layer="784" from-port="2" to-layer="786" to-port="0" /> <edge from-layer="785" from-port="0" to-layer="786" to-port="1" /> <edge from-layer="786" from-port="2" to-layer="791" to-port="0" /> <edge from-layer="786" from-port="2" to-layer="797" to-port="0" /> <edge from-layer="786" from-port="2" to-layer="787" to-port="0" /> <edge from-layer="787" from-port="2" to-layer="800" to-port="0" /> <edge from-layer="788" from-port="0" to-layer="791" to-port="1" /> <edge from-layer="789" from-port="0" to-layer="791" to-port="2" /> <edge from-layer="790" from-port="0" to-layer="791" to-port="3" /> <edge from-layer="791" from-port="5" to-layer="793" to-port="0" /> <edge from-layer="792" from-port="0" to-layer="793" to-port="1" /> <edge from-layer="793" from-port="2" to-layer="798" to-port="0" /> <edge from-layer="794" from-port="0" to-layer="797" to-port="1" /> <edge from-layer="795" from-port="0" to-layer="797" to-port="2" /> <edge from-layer="796" from-port="0" to-layer="797" to-port="3" /> <edge from-layer="797" from-port="5" to-layer="798" to-port="1" /> <edge from-layer="798" from-port="2" to-layer="799" to-port="0" /> <edge from-layer="799" from-port="2" to-layer="800" to-port="1" /> <edge from-layer="800" from-port="2" to-layer="857" to-port="0" /> <edge from-layer="801" from-port="1" to-layer="803" to-port="0" /> <edge from-layer="802" from-port="0" to-layer="803" to-port="2" /> <edge from-layer="803" from-port="3" to-layer="831" to-port="0" /> <edge from-layer="804" from-port="0" to-layer="805" to-port="0" /> <edge from-layer="805" from-port="1" to-layer="808" to-port="0" /> <edge from-layer="806" from-port="0" to-layer="807" to-port="0" /> <edge from-layer="807" from-port="1" to-layer="808" to-port="1" /> <edge from-layer="808" from-port="2" to-layer="810" to-port="0" /> <edge from-layer="809" from-port="0" to-layer="810" to-port="1" /> <edge from-layer="810" from-port="2" to-layer="811" to-port="0" /> <edge from-layer="811" from-port="1" to-layer="812" to-port="1" /> <edge from-layer="812" from-port="2" to-layer="814" to-port="0" /> <edge from-layer="813" from-port="0" to-layer="814" to-port="1" /> <edge from-layer="814" from-port="2" to-layer="816" to-port="0" /> <edge from-layer="815" from-port="0" to-layer="816" to-port="1" /> <edge from-layer="816" from-port="2" to-layer="817" to-port="0" /> <edge from-layer="816" from-port="2" to-layer="827" to-port="0" /> <edge from-layer="816" from-port="2" to-layer="821" to-port="0" /> <edge from-layer="817" from-port="2" to-layer="830" to-port="0" /> <edge from-layer="818" from-port="0" to-layer="821" to-port="1" /> <edge from-layer="819" from-port="0" to-layer="821" to-port="2" /> <edge from-layer="820" from-port="0" to-layer="821" to-port="3" /> <edge from-layer="821" from-port="5" to-layer="823" to-port="0" /> <edge from-layer="822" from-port="0" to-layer="823" to-port="1" /> <edge from-layer="823" from-port="2" to-layer="828" to-port="0" /> <edge from-layer="824" from-port="0" to-layer="827" to-port="1" /> <edge from-layer="825" from-port="0" to-layer="827" to-port="2" /> <edge from-layer="826" from-port="0" to-layer="827" to-port="3" /> <edge from-layer="827" from-port="5" to-layer="828" to-port="1" /> <edge from-layer="828" from-port="2" to-layer="829" to-port="0" /> <edge from-layer="829" from-port="2" to-layer="830" to-port="1" /> <edge from-layer="830" from-port="2" to-layer="831" to-port="1" /> <edge from-layer="831" from-port="2" to-layer="1584" to-port="0" /> <edge from-layer="831" from-port="2" to-layer="832" to-port="0" /> <edge from-layer="832" from-port="2" to-layer="833" to-port="0" /> <edge from-layer="833" from-port="2" to-layer="835" to-port="0" /> <edge from-layer="834" from-port="0" to-layer="835" to-port="1" /> <edge from-layer="835" from-port="2" to-layer="857" to-port="1" /> <edge from-layer="836" from-port="1" to-layer="838" to-port="0" /> <edge from-layer="837" from-port="0" to-layer="838" to-port="2" /> <edge from-layer="838" from-port="3" to-layer="852" to-port="0" /> <edge from-layer="839" from-port="0" to-layer="840" to-port="0" /> <edge from-layer="840" from-port="1" to-layer="843" to-port="0" /> <edge from-layer="841" from-port="0" to-layer="842" to-port="0" /> <edge from-layer="842" from-port="1" to-layer="843" to-port="1" /> <edge from-layer="843" from-port="2" to-layer="845" to-port="0" /> <edge from-layer="844" from-port="0" to-layer="845" to-port="1" /> <edge from-layer="845" from-port="2" to-layer="846" to-port="0" /> <edge from-layer="846" from-port="1" to-layer="847" to-port="1" /> <edge from-layer="847" from-port="2" to-layer="849" to-port="0" /> <edge from-layer="848" from-port="0" to-layer="849" to-port="1" /> <edge from-layer="849" from-port="2" to-layer="851" to-port="0" /> <edge from-layer="850" from-port="0" to-layer="851" to-port="1" /> <edge from-layer="851" from-port="2" to-layer="852" to-port="1" /> <edge from-layer="852" from-port="2" to-layer="1583" to-port="0" /> <edge from-layer="852" from-port="2" to-layer="853" to-port="0" /> <edge from-layer="853" from-port="2" to-layer="854" to-port="0" /> <edge from-layer="854" from-port="2" to-layer="856" to-port="0" /> <edge from-layer="855" from-port="0" to-layer="856" to-port="1" /> <edge from-layer="856" from-port="2" to-layer="857" to-port="2" /> <edge from-layer="857" from-port="4" to-layer="859" to-port="0" /> <edge from-layer="858" from-port="0" to-layer="859" to-port="1" /> <edge from-layer="859" from-port="2" to-layer="860" to-port="0" /> <edge from-layer="860" from-port="2" to-layer="869" to-port="0" /> <edge from-layer="861" from-port="0" to-layer="862" to-port="0" /> <edge from-layer="862" from-port="1" to-layer="865" to-port="0" /> <edge from-layer="863" from-port="0" to-layer="864" to-port="0" /> <edge from-layer="864" from-port="1" to-layer="865" to-port="1" /> <edge from-layer="865" from-port="2" to-layer="867" to-port="0" /> <edge from-layer="866" from-port="0" to-layer="867" to-port="1" /> <edge from-layer="867" from-port="2" to-layer="868" to-port="0" /> <edge from-layer="868" from-port="1" to-layer="869" to-port="1" /> <edge from-layer="869" from-port="2" to-layer="870" to-port="1" /> <edge from-layer="870" from-port="2" to-layer="912" to-port="0" /> <edge from-layer="870" from-port="2" to-layer="874" to-port="0" /> <edge from-layer="870" from-port="2" to-layer="881" to-port="0" /> <edge from-layer="871" from-port="0" to-layer="882" to-port="0" /> <edge from-layer="872" from-port="0" to-layer="880" to-port="0" /> <edge from-layer="873" from-port="0" to-layer="874" to-port="1" /> <edge from-layer="874" from-port="2" to-layer="876" to-port="0" /> <edge from-layer="875" from-port="0" to-layer="876" to-port="1" /> <edge from-layer="876" from-port="2" to-layer="878" to-port="0" /> <edge from-layer="877" from-port="0" to-layer="878" to-port="1" /> <edge from-layer="878" from-port="2" to-layer="879" to-port="0" /> <edge from-layer="879" from-port="1" to-layer="880" to-port="1" /> <edge from-layer="880" from-port="2" to-layer="881" to-port="1" /> <edge from-layer="881" from-port="2" to-layer="882" to-port="1" /> <edge from-layer="882" from-port="2" to-layer="901" to-port="0" /> <edge from-layer="882" from-port="2" to-layer="891" to-port="0" /> <edge from-layer="883" from-port="0" to-layer="884" to-port="0" /> <edge from-layer="884" from-port="1" to-layer="887" to-port="0" /> <edge from-layer="885" from-port="0" to-layer="886" to-port="0" /> <edge from-layer="886" from-port="1" to-layer="887" to-port="1" /> <edge from-layer="887" from-port="2" to-layer="889" to-port="0" /> <edge from-layer="888" from-port="0" to-layer="889" to-port="1" /> <edge from-layer="889" from-port="2" to-layer="890" to-port="0" /> <edge from-layer="890" from-port="1" to-layer="891" to-port="1" /> <edge from-layer="891" from-port="2" to-layer="892" to-port="0" /> <edge from-layer="892" from-port="1" to-layer="902" to-port="0" /> <edge from-layer="893" from-port="0" to-layer="894" to-port="0" /> <edge from-layer="894" from-port="1" to-layer="897" to-port="0" /> <edge from-layer="895" from-port="0" to-layer="896" to-port="0" /> <edge from-layer="896" from-port="1" to-layer="897" to-port="1" /> <edge from-layer="897" from-port="2" to-layer="899" to-port="0" /> <edge from-layer="898" from-port="0" to-layer="899" to-port="1" /> <edge from-layer="899" from-port="2" to-layer="900" to-port="0" /> <edge from-layer="900" from-port="1" to-layer="901" to-port="1" /> <edge from-layer="901" from-port="2" to-layer="902" to-port="1" /> <edge from-layer="902" from-port="2" to-layer="911" to-port="0" /> <edge from-layer="903" from-port="0" to-layer="904" to-port="0" /> <edge from-layer="904" from-port="1" to-layer="907" to-port="0" /> <edge from-layer="905" from-port="0" to-layer="906" to-port="0" /> <edge from-layer="906" from-port="1" to-layer="907" to-port="1" /> <edge from-layer="907" from-port="2" to-layer="909" to-port="0" /> <edge from-layer="908" from-port="0" to-layer="909" to-port="1" /> <edge from-layer="909" from-port="2" to-layer="910" to-port="0" /> <edge from-layer="910" from-port="1" to-layer="911" to-port="1" /> <edge from-layer="911" from-port="2" to-layer="912" to-port="1" /> <edge from-layer="912" from-port="2" to-layer="923" to-port="0" /> <edge from-layer="912" from-port="2" to-layer="916" to-port="0" /> <edge from-layer="912" from-port="2" to-layer="1021" to-port="0" /> <edge from-layer="913" from-port="0" to-layer="924" to-port="0" /> <edge from-layer="914" from-port="0" to-layer="922" to-port="0" /> <edge from-layer="915" from-port="0" to-layer="916" to-port="1" /> <edge from-layer="916" from-port="2" to-layer="918" to-port="0" /> <edge from-layer="917" from-port="0" to-layer="918" to-port="1" /> <edge from-layer="918" from-port="2" to-layer="920" to-port="0" /> <edge from-layer="919" from-port="0" to-layer="920" to-port="1" /> <edge from-layer="920" from-port="2" to-layer="921" to-port="0" /> <edge from-layer="921" from-port="1" to-layer="922" to-port="1" /> <edge from-layer="922" from-port="2" to-layer="923" to-port="1" /> <edge from-layer="923" from-port="2" to-layer="924" to-port="1" /> <edge from-layer="924" from-port="2" to-layer="933" to-port="0" /> <edge from-layer="924" from-port="2" to-layer="963" to-port="0" /> <edge from-layer="924" from-port="2" to-layer="998" to-port="0" /> <edge from-layer="925" from-port="0" to-layer="926" to-port="0" /> <edge from-layer="926" from-port="1" to-layer="929" to-port="0" /> <edge from-layer="927" from-port="0" to-layer="928" to-port="0" /> <edge from-layer="928" from-port="1" to-layer="929" to-port="1" /> <edge from-layer="929" from-port="2" to-layer="931" to-port="0" /> <edge from-layer="930" from-port="0" to-layer="931" to-port="1" /> <edge from-layer="931" from-port="2" to-layer="932" to-port="0" /> <edge from-layer="932" from-port="1" to-layer="933" to-port="1" /> <edge from-layer="933" from-port="2" to-layer="935" to-port="0" /> <edge from-layer="934" from-port="0" to-layer="935" to-port="1" /> <edge from-layer="935" from-port="2" to-layer="937" to-port="0" /> <edge from-layer="936" from-port="0" to-layer="937" to-port="1" /> <edge from-layer="937" from-port="2" to-layer="948" to-port="0" /> <edge from-layer="937" from-port="2" to-layer="938" to-port="0" /> <edge from-layer="937" from-port="2" to-layer="942" to-port="0" /> <edge from-layer="938" from-port="2" to-layer="951" to-port="0" /> <edge from-layer="939" from-port="0" to-layer="942" to-port="1" /> <edge from-layer="940" from-port="0" to-layer="942" to-port="2" /> <edge from-layer="941" from-port="0" to-layer="942" to-port="3" /> <edge from-layer="942" from-port="5" to-layer="944" to-port="0" /> <edge from-layer="943" from-port="0" to-layer="944" to-port="1" /> <edge from-layer="944" from-port="2" to-layer="949" to-port="0" /> <edge from-layer="945" from-port="0" to-layer="948" to-port="1" /> <edge from-layer="946" from-port="0" to-layer="948" to-port="2" /> <edge from-layer="947" from-port="0" to-layer="948" to-port="3" /> <edge from-layer="948" from-port="5" to-layer="949" to-port="1" /> <edge from-layer="949" from-port="2" to-layer="950" to-port="0" /> <edge from-layer="950" from-port="2" to-layer="951" to-port="1" /> <edge from-layer="951" from-port="2" to-layer="1008" to-port="0" /> <edge from-layer="952" from-port="1" to-layer="954" to-port="0" /> <edge from-layer="953" from-port="0" to-layer="954" to-port="2" /> <edge from-layer="954" from-port="3" to-layer="982" to-port="0" /> <edge from-layer="955" from-port="0" to-layer="956" to-port="0" /> <edge from-layer="956" from-port="1" to-layer="959" to-port="0" /> <edge from-layer="957" from-port="0" to-layer="958" to-port="0" /> <edge from-layer="958" from-port="1" to-layer="959" to-port="1" /> <edge from-layer="959" from-port="2" to-layer="961" to-port="0" /> <edge from-layer="960" from-port="0" to-layer="961" to-port="1" /> <edge from-layer="961" from-port="2" to-layer="962" to-port="0" /> <edge from-layer="962" from-port="1" to-layer="963" to-port="1" /> <edge from-layer="963" from-port="2" to-layer="965" to-port="0" /> <edge from-layer="964" from-port="0" to-layer="965" to-port="1" /> <edge from-layer="965" from-port="2" to-layer="967" to-port="0" /> <edge from-layer="966" from-port="0" to-layer="967" to-port="1" /> <edge from-layer="967" from-port="2" to-layer="968" to-port="0" /> <edge from-layer="967" from-port="2" to-layer="972" to-port="0" /> <edge from-layer="967" from-port="2" to-layer="978" to-port="0" /> <edge from-layer="968" from-port="2" to-layer="981" to-port="0" /> <edge from-layer="969" from-port="0" to-layer="972" to-port="1" /> <edge from-layer="970" from-port="0" to-layer="972" to-port="2" /> <edge from-layer="971" from-port="0" to-layer="972" to-port="3" /> <edge from-layer="972" from-port="5" to-layer="974" to-port="0" /> <edge from-layer="973" from-port="0" to-layer="974" to-port="1" /> <edge from-layer="974" from-port="2" to-layer="979" to-port="0" /> <edge from-layer="975" from-port="0" to-layer="978" to-port="1" /> <edge from-layer="976" from-port="0" to-layer="978" to-port="2" /> <edge from-layer="977" from-port="0" to-layer="978" to-port="3" /> <edge from-layer="978" from-port="5" to-layer="979" to-port="1" /> <edge from-layer="979" from-port="2" to-layer="980" to-port="0" /> <edge from-layer="980" from-port="2" to-layer="981" to-port="1" /> <edge from-layer="981" from-port="2" to-layer="982" to-port="1" /> <edge from-layer="982" from-port="2" to-layer="983" to-port="0" /> <edge from-layer="982" from-port="2" to-layer="1582" to-port="0" /> <edge from-layer="983" from-port="2" to-layer="984" to-port="0" /> <edge from-layer="984" from-port="2" to-layer="986" to-port="0" /> <edge from-layer="985" from-port="0" to-layer="986" to-port="1" /> <edge from-layer="986" from-port="2" to-layer="1008" to-port="1" /> <edge from-layer="987" from-port="1" to-layer="989" to-port="0" /> <edge from-layer="988" from-port="0" to-layer="989" to-port="2" /> <edge from-layer="989" from-port="3" to-layer="1003" to-port="0" /> <edge from-layer="990" from-port="0" to-layer="991" to-port="0" /> <edge from-layer="991" from-port="1" to-layer="994" to-port="0" /> <edge from-layer="992" from-port="0" to-layer="993" to-port="0" /> <edge from-layer="993" from-port="1" to-layer="994" to-port="1" /> <edge from-layer="994" from-port="2" to-layer="996" to-port="0" /> <edge from-layer="995" from-port="0" to-layer="996" to-port="1" /> <edge from-layer="996" from-port="2" to-layer="997" to-port="0" /> <edge from-layer="997" from-port="1" to-layer="998" to-port="1" /> <edge from-layer="998" from-port="2" to-layer="1000" to-port="0" /> <edge from-layer="999" from-port="0" to-layer="1000" to-port="1" /> <edge from-layer="1000" from-port="2" to-layer="1002" to-port="0" /> <edge from-layer="1001" from-port="0" to-layer="1002" to-port="1" /> <edge from-layer="1002" from-port="2" to-layer="1003" to-port="1" /> <edge from-layer="1003" from-port="2" to-layer="1581" to-port="0" /> <edge from-layer="1003" from-port="2" to-layer="1004" to-port="0" /> <edge from-layer="1004" from-port="2" to-layer="1005" to-port="0" /> <edge from-layer="1005" from-port="2" to-layer="1007" to-port="0" /> <edge from-layer="1006" from-port="0" to-layer="1007" to-port="1" /> <edge from-layer="1007" from-port="2" to-layer="1008" to-port="2" /> <edge from-layer="1008" from-port="4" to-layer="1010" to-port="0" /> <edge from-layer="1009" from-port="0" to-layer="1010" to-port="1" /> <edge from-layer="1010" from-port="2" to-layer="1011" to-port="0" /> <edge from-layer="1011" from-port="2" to-layer="1020" to-port="0" /> <edge from-layer="1012" from-port="0" to-layer="1013" to-port="0" /> <edge from-layer="1013" from-port="1" to-layer="1016" to-port="0" /> <edge from-layer="1014" from-port="0" to-layer="1015" to-port="0" /> <edge from-layer="1015" from-port="1" to-layer="1016" to-port="1" /> <edge from-layer="1016" from-port="2" to-layer="1018" to-port="0" /> <edge from-layer="1017" from-port="0" to-layer="1018" to-port="1" /> <edge from-layer="1018" from-port="2" to-layer="1019" to-port="0" /> <edge from-layer="1019" from-port="1" to-layer="1020" to-port="1" /> <edge from-layer="1020" from-port="2" to-layer="1021" to-port="1" /> <edge from-layer="1021" from-port="2" to-layer="1063" to-port="0" /> <edge from-layer="1021" from-port="2" to-layer="1032" to-port="0" /> <edge from-layer="1021" from-port="2" to-layer="1025" to-port="0" /> <edge from-layer="1022" from-port="0" to-layer="1033" to-port="0" /> <edge from-layer="1023" from-port="0" to-layer="1031" to-port="0" /> <edge from-layer="1024" from-port="0" to-layer="1025" to-port="1" /> <edge from-layer="1025" from-port="2" to-layer="1027" to-port="0" /> <edge from-layer="1026" from-port="0" to-layer="1027" to-port="1" /> <edge from-layer="1027" from-port="2" to-layer="1029" to-port="0" /> <edge from-layer="1028" from-port="0" to-layer="1029" to-port="1" /> <edge from-layer="1029" from-port="2" to-layer="1030" to-port="0" /> <edge from-layer="1030" from-port="1" to-layer="1031" to-port="1" /> <edge from-layer="1031" from-port="2" to-layer="1032" to-port="1" /> <edge from-layer="1032" from-port="2" to-layer="1033" to-port="1" /> <edge from-layer="1033" from-port="2" to-layer="1042" to-port="0" /> <edge from-layer="1033" from-port="2" to-layer="1052" to-port="0" /> <edge from-layer="1034" from-port="0" to-layer="1035" to-port="0" /> <edge from-layer="1035" from-port="1" to-layer="1038" to-port="0" /> <edge from-layer="1036" from-port="0" to-layer="1037" to-port="0" /> <edge from-layer="1037" from-port="1" to-layer="1038" to-port="1" /> <edge from-layer="1038" from-port="2" to-layer="1040" to-port="0" /> <edge from-layer="1039" from-port="0" to-layer="1040" to-port="1" /> <edge from-layer="1040" from-port="2" to-layer="1041" to-port="0" /> <edge from-layer="1041" from-port="1" to-layer="1042" to-port="1" /> <edge from-layer="1042" from-port="2" to-layer="1043" to-port="0" /> <edge from-layer="1043" from-port="1" to-layer="1053" to-port="0" /> <edge from-layer="1044" from-port="0" to-layer="1045" to-port="0" /> <edge from-layer="1045" from-port="1" to-layer="1048" to-port="0" /> <edge from-layer="1046" from-port="0" to-layer="1047" to-port="0" /> <edge from-layer="1047" from-port="1" to-layer="1048" to-port="1" /> <edge from-layer="1048" from-port="2" to-layer="1050" to-port="0" /> <edge from-layer="1049" from-port="0" to-layer="1050" to-port="1" /> <edge from-layer="1050" from-port="2" to-layer="1051" to-port="0" /> <edge from-layer="1051" from-port="1" to-layer="1052" to-port="1" /> <edge from-layer="1052" from-port="2" to-layer="1053" to-port="1" /> <edge from-layer="1053" from-port="2" to-layer="1062" to-port="0" /> <edge from-layer="1054" from-port="0" to-layer="1055" to-port="0" /> <edge from-layer="1055" from-port="1" to-layer="1058" to-port="0" /> <edge from-layer="1056" from-port="0" to-layer="1057" to-port="0" /> <edge from-layer="1057" from-port="1" to-layer="1058" to-port="1" /> <edge from-layer="1058" from-port="2" to-layer="1060" to-port="0" /> <edge from-layer="1059" from-port="0" to-layer="1060" to-port="1" /> <edge from-layer="1060" from-port="2" to-layer="1061" to-port="0" /> <edge from-layer="1061" from-port="1" to-layer="1062" to-port="1" /> <edge from-layer="1062" from-port="2" to-layer="1063" to-port="1" /> <edge from-layer="1063" from-port="2" to-layer="1074" to-port="0" /> <edge from-layer="1063" from-port="2" to-layer="1172" to-port="0" /> <edge from-layer="1063" from-port="2" to-layer="1067" to-port="0" /> <edge from-layer="1064" from-port="0" to-layer="1075" to-port="0" /> <edge from-layer="1065" from-port="0" to-layer="1073" to-port="0" /> <edge from-layer="1066" from-port="0" to-layer="1067" to-port="1" /> <edge from-layer="1067" from-port="2" to-layer="1069" to-port="0" /> <edge from-layer="1068" from-port="0" to-layer="1069" to-port="1" /> <edge from-layer="1069" from-port="2" to-layer="1071" to-port="0" /> <edge from-layer="1070" from-port="0" to-layer="1071" to-port="1" /> <edge from-layer="1071" from-port="2" to-layer="1072" to-port="0" /> <edge from-layer="1072" from-port="1" to-layer="1073" to-port="1" /> <edge from-layer="1073" from-port="2" to-layer="1074" to-port="1" /> <edge from-layer="1074" from-port="2" to-layer="1075" to-port="1" /> <edge from-layer="1075" from-port="2" to-layer="1149" to-port="0" /> <edge from-layer="1075" from-port="2" to-layer="1114" to-port="0" /> <edge from-layer="1075" from-port="2" to-layer="1084" to-port="0" /> <edge from-layer="1076" from-port="0" to-layer="1077" to-port="0" /> <edge from-layer="1077" from-port="1" to-layer="1080" to-port="0" /> <edge from-layer="1078" from-port="0" to-layer="1079" to-port="0" /> <edge from-layer="1079" from-port="1" to-layer="1080" to-port="1" /> <edge from-layer="1080" from-port="2" to-layer="1082" to-port="0" /> <edge from-layer="1081" from-port="0" to-layer="1082" to-port="1" /> <edge from-layer="1082" from-port="2" to-layer="1083" to-port="0" /> <edge from-layer="1083" from-port="1" to-layer="1084" to-port="1" /> <edge from-layer="1084" from-port="2" to-layer="1086" to-port="0" /> <edge from-layer="1085" from-port="0" to-layer="1086" to-port="1" /> <edge from-layer="1086" from-port="2" to-layer="1088" to-port="0" /> <edge from-layer="1087" from-port="0" to-layer="1088" to-port="1" /> <edge from-layer="1088" from-port="2" to-layer="1089" to-port="0" /> <edge from-layer="1088" from-port="2" to-layer="1093" to-port="0" /> <edge from-layer="1088" from-port="2" to-layer="1099" to-port="0" /> <edge from-layer="1089" from-port="2" to-layer="1102" to-port="0" /> <edge from-layer="1090" from-port="0" to-layer="1093" to-port="1" /> <edge from-layer="1091" from-port="0" to-layer="1093" to-port="2" /> <edge from-layer="1092" from-port="0" to-layer="1093" to-port="3" /> <edge from-layer="1093" from-port="5" to-layer="1095" to-port="0" /> <edge from-layer="1094" from-port="0" to-layer="1095" to-port="1" /> <edge from-layer="1095" from-port="2" to-layer="1100" to-port="0" /> <edge from-layer="1096" from-port="0" to-layer="1099" to-port="1" /> <edge from-layer="1097" from-port="0" to-layer="1099" to-port="2" /> <edge from-layer="1098" from-port="0" to-layer="1099" to-port="3" /> <edge from-layer="1099" from-port="5" to-layer="1100" to-port="1" /> <edge from-layer="1100" from-port="2" to-layer="1101" to-port="0" /> <edge from-layer="1101" from-port="2" to-layer="1102" to-port="1" /> <edge from-layer="1102" from-port="2" to-layer="1159" to-port="0" /> <edge from-layer="1103" from-port="1" to-layer="1105" to-port="0" /> <edge from-layer="1104" from-port="0" to-layer="1105" to-port="2" /> <edge from-layer="1105" from-port="3" to-layer="1133" to-port="0" /> <edge from-layer="1106" from-port="0" to-layer="1107" to-port="0" /> <edge from-layer="1107" from-port="1" to-layer="1110" to-port="0" /> <edge from-layer="1108" from-port="0" to-layer="1109" to-port="0" /> <edge from-layer="1109" from-port="1" to-layer="1110" to-port="1" /> <edge from-layer="1110" from-port="2" to-layer="1112" to-port="0" /> <edge from-layer="1111" from-port="0" to-layer="1112" to-port="1" /> <edge from-layer="1112" from-port="2" to-layer="1113" to-port="0" /> <edge from-layer="1113" from-port="1" to-layer="1114" to-port="1" /> <edge from-layer="1114" from-port="2" to-layer="1116" to-port="0" /> <edge from-layer="1115" from-port="0" to-layer="1116" to-port="1" /> <edge from-layer="1116" from-port="2" to-layer="1118" to-port="0" /> <edge from-layer="1117" from-port="0" to-layer="1118" to-port="1" /> <edge from-layer="1118" from-port="2" to-layer="1119" to-port="0" /> <edge from-layer="1118" from-port="2" to-layer="1123" to-port="0" /> <edge from-layer="1118" from-port="2" to-layer="1129" to-port="0" /> <edge from-layer="1119" from-port="2" to-layer="1132" to-port="0" /> <edge from-layer="1120" from-port="0" to-layer="1123" to-port="1" /> <edge from-layer="1121" from-port="0" to-layer="1123" to-port="2" /> <edge from-layer="1122" from-port="0" to-layer="1123" to-port="3" /> <edge from-layer="1123" from-port="5" to-layer="1125" to-port="0" /> <edge from-layer="1124" from-port="0" to-layer="1125" to-port="1" /> <edge from-layer="1125" from-port="2" to-layer="1130" to-port="0" /> <edge from-layer="1126" from-port="0" to-layer="1129" to-port="1" /> <edge from-layer="1127" from-port="0" to-layer="1129" to-port="2" /> <edge from-layer="1128" from-port="0" to-layer="1129" to-port="3" /> <edge from-layer="1129" from-port="5" to-layer="1130" to-port="1" /> <edge from-layer="1130" from-port="2" to-layer="1131" to-port="0" /> <edge from-layer="1131" from-port="2" to-layer="1132" to-port="1" /> <edge from-layer="1132" from-port="2" to-layer="1133" to-port="1" /> <edge from-layer="1133" from-port="2" to-layer="1134" to-port="0" /> <edge from-layer="1133" from-port="2" to-layer="1580" to-port="0" /> <edge from-layer="1134" from-port="2" to-layer="1135" to-port="0" /> <edge from-layer="1135" from-port="2" to-layer="1137" to-port="0" /> <edge from-layer="1136" from-port="0" to-layer="1137" to-port="1" /> <edge from-layer="1137" from-port="2" to-layer="1159" to-port="1" /> <edge from-layer="1138" from-port="1" to-layer="1140" to-port="0" /> <edge from-layer="1139" from-port="0" to-layer="1140" to-port="2" /> <edge from-layer="1140" from-port="3" to-layer="1154" to-port="0" /> <edge from-layer="1141" from-port="0" to-layer="1142" to-port="0" /> <edge from-layer="1142" from-port="1" to-layer="1145" to-port="0" /> <edge from-layer="1143" from-port="0" to-layer="1144" to-port="0" /> <edge from-layer="1144" from-port="1" to-layer="1145" to-port="1" /> <edge from-layer="1145" from-port="2" to-layer="1147" to-port="0" /> <edge from-layer="1146" from-port="0" to-layer="1147" to-port="1" /> <edge from-layer="1147" from-port="2" to-layer="1148" to-port="0" /> <edge from-layer="1148" from-port="1" to-layer="1149" to-port="1" /> <edge from-layer="1149" from-port="2" to-layer="1151" to-port="0" /> <edge from-layer="1150" from-port="0" to-layer="1151" to-port="1" /> <edge from-layer="1151" from-port="2" to-layer="1153" to-port="0" /> <edge from-layer="1152" from-port="0" to-layer="1153" to-port="1" /> <edge from-layer="1153" from-port="2" to-layer="1154" to-port="1" /> <edge from-layer="1154" from-port="2" to-layer="1579" to-port="0" /> <edge from-layer="1154" from-port="2" to-layer="1155" to-port="0" /> <edge from-layer="1155" from-port="2" to-layer="1156" to-port="0" /> <edge from-layer="1156" from-port="2" to-layer="1158" to-port="0" /> <edge from-layer="1157" from-port="0" to-layer="1158" to-port="1" /> <edge from-layer="1158" from-port="2" to-layer="1159" to-port="2" /> <edge from-layer="1159" from-port="4" to-layer="1161" to-port="0" /> <edge from-layer="1160" from-port="0" to-layer="1161" to-port="1" /> <edge from-layer="1161" from-port="2" to-layer="1162" to-port="0" /> <edge from-layer="1162" from-port="2" to-layer="1171" to-port="0" /> <edge from-layer="1163" from-port="0" to-layer="1164" to-port="0" /> <edge from-layer="1164" from-port="1" to-layer="1167" to-port="0" /> <edge from-layer="1165" from-port="0" to-layer="1166" to-port="0" /> <edge from-layer="1166" from-port="1" to-layer="1167" to-port="1" /> <edge from-layer="1167" from-port="2" to-layer="1169" to-port="0" /> <edge from-layer="1168" from-port="0" to-layer="1169" to-port="1" /> <edge from-layer="1169" from-port="2" to-layer="1170" to-port="0" /> <edge from-layer="1170" from-port="1" to-layer="1171" to-port="1" /> <edge from-layer="1171" from-port="2" to-layer="1172" to-port="1" /> <edge from-layer="1172" from-port="2" to-layer="1214" to-port="0" /> <edge from-layer="1172" from-port="2" to-layer="1176" to-port="0" /> <edge from-layer="1172" from-port="2" to-layer="1183" to-port="0" /> <edge from-layer="1173" from-port="0" to-layer="1184" to-port="0" /> <edge from-layer="1174" from-port="0" to-layer="1182" to-port="0" /> <edge from-layer="1175" from-port="0" to-layer="1176" to-port="1" /> <edge from-layer="1176" from-port="2" to-layer="1178" to-port="0" /> <edge from-layer="1177" from-port="0" to-layer="1178" to-port="1" /> <edge from-layer="1178" from-port="2" to-layer="1180" to-port="0" /> <edge from-layer="1179" from-port="0" to-layer="1180" to-port="1" /> <edge from-layer="1180" from-port="2" to-layer="1181" to-port="0" /> <edge from-layer="1181" from-port="1" to-layer="1182" to-port="1" /> <edge from-layer="1182" from-port="2" to-layer="1183" to-port="1" /> <edge from-layer="1183" from-port="2" to-layer="1184" to-port="1" /> <edge from-layer="1184" from-port="2" to-layer="1203" to-port="0" /> <edge from-layer="1184" from-port="2" to-layer="1193" to-port="0" /> <edge from-layer="1185" from-port="0" to-layer="1186" to-port="0" /> <edge from-layer="1186" from-port="1" to-layer="1189" to-port="0" /> <edge from-layer="1187" from-port="0" to-layer="1188" to-port="0" /> <edge from-layer="1188" from-port="1" to-layer="1189" to-port="1" /> <edge from-layer="1189" from-port="2" to-layer="1191" to-port="0" /> <edge from-layer="1190" from-port="0" to-layer="1191" to-port="1" /> <edge from-layer="1191" from-port="2" to-layer="1192" to-port="0" /> <edge from-layer="1192" from-port="1" to-layer="1193" to-port="1" /> <edge from-layer="1193" from-port="2" to-layer="1194" to-port="0" /> <edge from-layer="1194" from-port="1" to-layer="1204" to-port="0" /> <edge from-layer="1195" from-port="0" to-layer="1196" to-port="0" /> <edge from-layer="1196" from-port="1" to-layer="1199" to-port="0" /> <edge from-layer="1197" from-port="0" to-layer="1198" to-port="0" /> <edge from-layer="1198" from-port="1" to-layer="1199" to-port="1" /> <edge from-layer="1199" from-port="2" to-layer="1201" to-port="0" /> <edge from-layer="1200" from-port="0" to-layer="1201" to-port="1" /> <edge from-layer="1201" from-port="2" to-layer="1202" to-port="0" /> <edge from-layer="1202" from-port="1" to-layer="1203" to-port="1" /> <edge from-layer="1203" from-port="2" to-layer="1204" to-port="1" /> <edge from-layer="1204" from-port="2" to-layer="1213" to-port="0" /> <edge from-layer="1205" from-port="0" to-layer="1206" to-port="0" /> <edge from-layer="1206" from-port="1" to-layer="1209" to-port="0" /> <edge from-layer="1207" from-port="0" to-layer="1208" to-port="0" /> <edge from-layer="1208" from-port="1" to-layer="1209" to-port="1" /> <edge from-layer="1209" from-port="2" to-layer="1211" to-port="0" /> <edge from-layer="1210" from-port="0" to-layer="1211" to-port="1" /> <edge from-layer="1211" from-port="2" to-layer="1212" to-port="0" /> <edge from-layer="1212" from-port="1" to-layer="1213" to-port="1" /> <edge from-layer="1213" from-port="2" to-layer="1214" to-port="1" /> <edge from-layer="1214" from-port="2" to-layer="1323" to-port="0" /> <edge from-layer="1214" from-port="2" to-layer="1218" to-port="0" /> <edge from-layer="1214" from-port="2" to-layer="1225" to-port="0" /> <edge from-layer="1215" from-port="0" to-layer="1226" to-port="0" /> <edge from-layer="1216" from-port="0" to-layer="1224" to-port="0" /> <edge from-layer="1217" from-port="0" to-layer="1218" to-port="1" /> <edge from-layer="1218" from-port="2" to-layer="1220" to-port="0" /> <edge from-layer="1219" from-port="0" to-layer="1220" to-port="1" /> <edge from-layer="1220" from-port="2" to-layer="1222" to-port="0" /> <edge from-layer="1221" from-port="0" to-layer="1222" to-port="1" /> <edge from-layer="1222" from-port="2" to-layer="1223" to-port="0" /> <edge from-layer="1223" from-port="1" to-layer="1224" to-port="1" /> <edge from-layer="1224" from-port="2" to-layer="1225" to-port="1" /> <edge from-layer="1225" from-port="2" to-layer="1226" to-port="1" /> <edge from-layer="1226" from-port="2" to-layer="1235" to-port="0" /> <edge from-layer="1226" from-port="2" to-layer="1300" to-port="0" /> <edge from-layer="1226" from-port="2" to-layer="1265" to-port="0" /> <edge from-layer="1227" from-port="0" to-layer="1228" to-port="0" /> <edge from-layer="1228" from-port="1" to-layer="1231" to-port="0" /> <edge from-layer="1229" from-port="0" to-layer="1230" to-port="0" /> <edge from-layer="1230" from-port="1" to-layer="1231" to-port="1" /> <edge from-layer="1231" from-port="2" to-layer="1233" to-port="0" /> <edge from-layer="1232" from-port="0" to-layer="1233" to-port="1" /> <edge from-layer="1233" from-port="2" to-layer="1234" to-port="0" /> <edge from-layer="1234" from-port="1" to-layer="1235" to-port="1" /> <edge from-layer="1235" from-port="2" to-layer="1237" to-port="0" /> <edge from-layer="1236" from-port="0" to-layer="1237" to-port="1" /> <edge from-layer="1237" from-port="2" to-layer="1239" to-port="0" /> <edge from-layer="1238" from-port="0" to-layer="1239" to-port="1" /> <edge from-layer="1239" from-port="2" to-layer="1240" to-port="0" /> <edge from-layer="1239" from-port="2" to-layer="1250" to-port="0" /> <edge from-layer="1239" from-port="2" to-layer="1244" to-port="0" /> <edge from-layer="1240" from-port="2" to-layer="1253" to-port="0" /> <edge from-layer="1241" from-port="0" to-layer="1244" to-port="1" /> <edge from-layer="1242" from-port="0" to-layer="1244" to-port="2" /> <edge from-layer="1243" from-port="0" to-layer="1244" to-port="3" /> <edge from-layer="1244" from-port="5" to-layer="1246" to-port="0" /> <edge from-layer="1245" from-port="0" to-layer="1246" to-port="1" /> <edge from-layer="1246" from-port="2" to-layer="1251" to-port="0" /> <edge from-layer="1247" from-port="0" to-layer="1250" to-port="1" /> <edge from-layer="1248" from-port="0" to-layer="1250" to-port="2" /> <edge from-layer="1249" from-port="0" to-layer="1250" to-port="3" /> <edge from-layer="1250" from-port="5" to-layer="1251" to-port="1" /> <edge from-layer="1251" from-port="2" to-layer="1252" to-port="0" /> <edge from-layer="1252" from-port="2" to-layer="1253" to-port="1" /> <edge from-layer="1253" from-port="2" to-layer="1310" to-port="0" /> <edge from-layer="1254" from-port="1" to-layer="1256" to-port="0" /> <edge from-layer="1255" from-port="0" to-layer="1256" to-port="2" /> <edge from-layer="1256" from-port="3" to-layer="1284" to-port="0" /> <edge from-layer="1257" from-port="0" to-layer="1258" to-port="0" /> <edge from-layer="1258" from-port="1" to-layer="1261" to-port="0" /> <edge from-layer="1259" from-port="0" to-layer="1260" to-port="0" /> <edge from-layer="1260" from-port="1" to-layer="1261" to-port="1" /> <edge from-layer="1261" from-port="2" to-layer="1263" to-port="0" /> <edge from-layer="1262" from-port="0" to-layer="1263" to-port="1" /> <edge from-layer="1263" from-port="2" to-layer="1264" to-port="0" /> <edge from-layer="1264" from-port="1" to-layer="1265" to-port="1" /> <edge from-layer="1265" from-port="2" to-layer="1267" to-port="0" /> <edge from-layer="1266" from-port="0" to-layer="1267" to-port="1" /> <edge from-layer="1267" from-port="2" to-layer="1269" to-port="0" /> <edge from-layer="1268" from-port="0" to-layer="1269" to-port="1" /> <edge from-layer="1269" from-port="2" to-layer="1274" to-port="0" /> <edge from-layer="1269" from-port="2" to-layer="1280" to-port="0" /> <edge from-layer="1269" from-port="2" to-layer="1270" to-port="0" /> <edge from-layer="1270" from-port="2" to-layer="1283" to-port="0" /> <edge from-layer="1271" from-port="0" to-layer="1274" to-port="1" /> <edge from-layer="1272" from-port="0" to-layer="1274" to-port="2" /> <edge from-layer="1273" from-port="0" to-layer="1274" to-port="3" /> <edge from-layer="1274" from-port="5" to-layer="1276" to-port="0" /> <edge from-layer="1275" from-port="0" to-layer="1276" to-port="1" /> <edge from-layer="1276" from-port="2" to-layer="1281" to-port="0" /> <edge from-layer="1277" from-port="0" to-layer="1280" to-port="1" /> <edge from-layer="1278" from-port="0" to-layer="1280" to-port="2" /> <edge from-layer="1279" from-port="0" to-layer="1280" to-port="3" /> <edge from-layer="1280" from-port="5" to-layer="1281" to-port="1" /> <edge from-layer="1281" from-port="2" to-layer="1282" to-port="0" /> <edge from-layer="1282" from-port="2" to-layer="1283" to-port="1" /> <edge from-layer="1283" from-port="2" to-layer="1284" to-port="1" /> <edge from-layer="1284" from-port="2" to-layer="1578" to-port="0" /> <edge from-layer="1284" from-port="2" to-layer="1285" to-port="0" /> <edge from-layer="1285" from-port="2" to-layer="1286" to-port="0" /> <edge from-layer="1286" from-port="2" to-layer="1288" to-port="0" /> <edge from-layer="1287" from-port="0" to-layer="1288" to-port="1" /> <edge from-layer="1288" from-port="2" to-layer="1310" to-port="1" /> <edge from-layer="1289" from-port="1" to-layer="1291" to-port="0" /> <edge from-layer="1290" from-port="0" to-layer="1291" to-port="2" /> <edge from-layer="1291" from-port="3" to-layer="1305" to-port="0" /> <edge from-layer="1292" from-port="0" to-layer="1293" to-port="0" /> <edge from-layer="1293" from-port="1" to-layer="1296" to-port="0" /> <edge from-layer="1294" from-port="0" to-layer="1295" to-port="0" /> <edge from-layer="1295" from-port="1" to-layer="1296" to-port="1" /> <edge from-layer="1296" from-port="2" to-layer="1298" to-port="0" /> <edge from-layer="1297" from-port="0" to-layer="1298" to-port="1" /> <edge from-layer="1298" from-port="2" to-layer="1299" to-port="0" /> <edge from-layer="1299" from-port="1" to-layer="1300" to-port="1" /> <edge from-layer="1300" from-port="2" to-layer="1302" to-port="0" /> <edge from-layer="1301" from-port="0" to-layer="1302" to-port="1" /> <edge from-layer="1302" from-port="2" to-layer="1304" to-port="0" /> <edge from-layer="1303" from-port="0" to-layer="1304" to-port="1" /> <edge from-layer="1304" from-port="2" to-layer="1305" to-port="1" /> <edge from-layer="1305" from-port="2" to-layer="1306" to-port="0" /> <edge from-layer="1305" from-port="2" to-layer="1577" to-port="0" /> <edge from-layer="1306" from-port="2" to-layer="1307" to-port="0" /> <edge from-layer="1307" from-port="2" to-layer="1309" to-port="0" /> <edge from-layer="1308" from-port="0" to-layer="1309" to-port="1" /> <edge from-layer="1309" from-port="2" to-layer="1310" to-port="2" /> <edge from-layer="1310" from-port="4" to-layer="1312" to-port="0" /> <edge from-layer="1311" from-port="0" to-layer="1312" to-port="1" /> <edge from-layer="1312" from-port="2" to-layer="1313" to-port="0" /> <edge from-layer="1313" from-port="2" to-layer="1322" to-port="0" /> <edge from-layer="1314" from-port="0" to-layer="1315" to-port="0" /> <edge from-layer="1315" from-port="1" to-layer="1318" to-port="0" /> <edge from-layer="1316" from-port="0" to-layer="1317" to-port="0" /> <edge from-layer="1317" from-port="1" to-layer="1318" to-port="1" /> <edge from-layer="1318" from-port="2" to-layer="1320" to-port="0" /> <edge from-layer="1319" from-port="0" to-layer="1320" to-port="1" /> <edge from-layer="1320" from-port="2" to-layer="1321" to-port="0" /> <edge from-layer="1321" from-port="1" to-layer="1322" to-port="1" /> <edge from-layer="1322" from-port="2" to-layer="1323" to-port="1" /> <edge from-layer="1323" from-port="2" to-layer="1327" to-port="0" /> <edge from-layer="1323" from-port="2" to-layer="1365" to-port="0" /> <edge from-layer="1323" from-port="2" to-layer="1334" to-port="0" /> <edge from-layer="1324" from-port="0" to-layer="1335" to-port="0" /> <edge from-layer="1325" from-port="0" to-layer="1333" to-port="0" /> <edge from-layer="1326" from-port="0" to-layer="1327" to-port="1" /> <edge from-layer="1327" from-port="2" to-layer="1329" to-port="0" /> <edge from-layer="1328" from-port="0" to-layer="1329" to-port="1" /> <edge from-layer="1329" from-port="2" to-layer="1331" to-port="0" /> <edge from-layer="1330" from-port="0" to-layer="1331" to-port="1" /> <edge from-layer="1331" from-port="2" to-layer="1332" to-port="0" /> <edge from-layer="1332" from-port="1" to-layer="1333" to-port="1" /> <edge from-layer="1333" from-port="2" to-layer="1334" to-port="1" /> <edge from-layer="1334" from-port="2" to-layer="1335" to-port="1" /> <edge from-layer="1335" from-port="2" to-layer="1344" to-port="0" /> <edge from-layer="1335" from-port="2" to-layer="1354" to-port="0" /> <edge from-layer="1336" from-port="0" to-layer="1337" to-port="0" /> <edge from-layer="1337" from-port="1" to-layer="1340" to-port="0" /> <edge from-layer="1338" from-port="0" to-layer="1339" to-port="0" /> <edge from-layer="1339" from-port="1" to-layer="1340" to-port="1" /> <edge from-layer="1340" from-port="2" to-layer="1342" to-port="0" /> <edge from-layer="1341" from-port="0" to-layer="1342" to-port="1" /> <edge from-layer="1342" from-port="2" to-layer="1343" to-port="0" /> <edge from-layer="1343" from-port="1" to-layer="1344" to-port="1" /> <edge from-layer="1344" from-port="2" to-layer="1345" to-port="0" /> <edge from-layer="1345" from-port="1" to-layer="1355" to-port="0" /> <edge from-layer="1346" from-port="0" to-layer="1347" to-port="0" /> <edge from-layer="1347" from-port="1" to-layer="1350" to-port="0" /> <edge from-layer="1348" from-port="0" to-layer="1349" to-port="0" /> <edge from-layer="1349" from-port="1" to-layer="1350" to-port="1" /> <edge from-layer="1350" from-port="2" to-layer="1352" to-port="0" /> <edge from-layer="1351" from-port="0" to-layer="1352" to-port="1" /> <edge from-layer="1352" from-port="2" to-layer="1353" to-port="0" /> <edge from-layer="1353" from-port="1" to-layer="1354" to-port="1" /> <edge from-layer="1354" from-port="2" to-layer="1355" to-port="1" /> <edge from-layer="1355" from-port="2" to-layer="1364" to-port="0" /> <edge from-layer="1356" from-port="0" to-layer="1357" to-port="0" /> <edge from-layer="1357" from-port="1" to-layer="1360" to-port="0" /> <edge from-layer="1358" from-port="0" to-layer="1359" to-port="0" /> <edge from-layer="1359" from-port="1" to-layer="1360" to-port="1" /> <edge from-layer="1360" from-port="2" to-layer="1362" to-port="0" /> <edge from-layer="1361" from-port="0" to-layer="1362" to-port="1" /> <edge from-layer="1362" from-port="2" to-layer="1363" to-port="0" /> <edge from-layer="1363" from-port="1" to-layer="1364" to-port="1" /> <edge from-layer="1364" from-port="2" to-layer="1365" to-port="1" /> <edge from-layer="1365" from-port="2" to-layer="1369" to-port="0" /> <edge from-layer="1365" from-port="2" to-layer="1474" to-port="0" /> <edge from-layer="1365" from-port="2" to-layer="1376" to-port="0" /> <edge from-layer="1366" from-port="0" to-layer="1377" to-port="0" /> <edge from-layer="1367" from-port="0" to-layer="1375" to-port="0" /> <edge from-layer="1368" from-port="0" to-layer="1369" to-port="1" /> <edge from-layer="1369" from-port="2" to-layer="1371" to-port="0" /> <edge from-layer="1370" from-port="0" to-layer="1371" to-port="1" /> <edge from-layer="1371" from-port="2" to-layer="1373" to-port="0" /> <edge from-layer="1372" from-port="0" to-layer="1373" to-port="1" /> <edge from-layer="1373" from-port="2" to-layer="1374" to-port="0" /> <edge from-layer="1374" from-port="1" to-layer="1375" to-port="1" /> <edge from-layer="1375" from-port="2" to-layer="1376" to-port="1" /> <edge from-layer="1376" from-port="2" to-layer="1377" to-port="1" /> <edge from-layer="1377" from-port="2" to-layer="1451" to-port="0" /> <edge from-layer="1377" from-port="2" to-layer="1416" to-port="0" /> <edge from-layer="1377" from-port="2" to-layer="1386" to-port="0" /> <edge from-layer="1378" from-port="0" to-layer="1379" to-port="0" /> <edge from-layer="1379" from-port="1" to-layer="1382" to-port="0" /> <edge from-layer="1380" from-port="0" to-layer="1381" to-port="0" /> <edge from-layer="1381" from-port="1" to-layer="1382" to-port="1" /> <edge from-layer="1382" from-port="2" to-layer="1384" to-port="0" /> <edge from-layer="1383" from-port="0" to-layer="1384" to-port="1" /> <edge from-layer="1384" from-port="2" to-layer="1385" to-port="0" /> <edge from-layer="1385" from-port="1" to-layer="1386" to-port="1" /> <edge from-layer="1386" from-port="2" to-layer="1388" to-port="0" /> <edge from-layer="1387" from-port="0" to-layer="1388" to-port="1" /> <edge from-layer="1388" from-port="2" to-layer="1390" to-port="0" /> <edge from-layer="1389" from-port="0" to-layer="1390" to-port="1" /> <edge from-layer="1390" from-port="2" to-layer="1395" to-port="0" /> <edge from-layer="1390" from-port="2" to-layer="1401" to-port="0" /> <edge from-layer="1390" from-port="2" to-layer="1391" to-port="0" /> <edge from-layer="1391" from-port="2" to-layer="1404" to-port="0" /> <edge from-layer="1392" from-port="0" to-layer="1395" to-port="1" /> <edge from-layer="1393" from-port="0" to-layer="1395" to-port="2" /> <edge from-layer="1394" from-port="0" to-layer="1395" to-port="3" /> <edge from-layer="1395" from-port="5" to-layer="1397" to-port="0" /> <edge from-layer="1396" from-port="0" to-layer="1397" to-port="1" /> <edge from-layer="1397" from-port="2" to-layer="1402" to-port="0" /> <edge from-layer="1398" from-port="0" to-layer="1401" to-port="1" /> <edge from-layer="1399" from-port="0" to-layer="1401" to-port="2" /> <edge from-layer="1400" from-port="0" to-layer="1401" to-port="3" /> <edge from-layer="1401" from-port="5" to-layer="1402" to-port="1" /> <edge from-layer="1402" from-port="2" to-layer="1403" to-port="0" /> <edge from-layer="1403" from-port="2" to-layer="1404" to-port="1" /> <edge from-layer="1404" from-port="2" to-layer="1461" to-port="0" /> <edge from-layer="1405" from-port="1" to-layer="1407" to-port="0" /> <edge from-layer="1406" from-port="0" to-layer="1407" to-port="2" /> <edge from-layer="1407" from-port="3" to-layer="1435" to-port="0" /> <edge from-layer="1408" from-port="0" to-layer="1409" to-port="0" /> <edge from-layer="1409" from-port="1" to-layer="1412" to-port="0" /> <edge from-layer="1410" from-port="0" to-layer="1411" to-port="0" /> <edge from-layer="1411" from-port="1" to-layer="1412" to-port="1" /> <edge from-layer="1412" from-port="2" to-layer="1414" to-port="0" /> <edge from-layer="1413" from-port="0" to-layer="1414" to-port="1" /> <edge from-layer="1414" from-port="2" to-layer="1415" to-port="0" /> <edge from-layer="1415" from-port="1" to-layer="1416" to-port="1" /> <edge from-layer="1416" from-port="2" to-layer="1418" to-port="0" /> <edge from-layer="1417" from-port="0" to-layer="1418" to-port="1" /> <edge from-layer="1418" from-port="2" to-layer="1420" to-port="0" /> <edge from-layer="1419" from-port="0" to-layer="1420" to-port="1" /> <edge from-layer="1420" from-port="2" to-layer="1421" to-port="0" /> <edge from-layer="1420" from-port="2" to-layer="1425" to-port="0" /> <edge from-layer="1420" from-port="2" to-layer="1431" to-port="0" /> <edge from-layer="1421" from-port="2" to-layer="1434" to-port="0" /> <edge from-layer="1422" from-port="0" to-layer="1425" to-port="1" /> <edge from-layer="1423" from-port="0" to-layer="1425" to-port="2" /> <edge from-layer="1424" from-port="0" to-layer="1425" to-port="3" /> <edge from-layer="1425" from-port="5" to-layer="1427" to-port="0" /> <edge from-layer="1426" from-port="0" to-layer="1427" to-port="1" /> <edge from-layer="1427" from-port="2" to-layer="1432" to-port="0" /> <edge from-layer="1428" from-port="0" to-layer="1431" to-port="1" /> <edge from-layer="1429" from-port="0" to-layer="1431" to-port="2" /> <edge from-layer="1430" from-port="0" to-layer="1431" to-port="3" /> <edge from-layer="1431" from-port="5" to-layer="1432" to-port="1" /> <edge from-layer="1432" from-port="2" to-layer="1433" to-port="0" /> <edge from-layer="1433" from-port="2" to-layer="1434" to-port="1" /> <edge from-layer="1434" from-port="2" to-layer="1435" to-port="1" /> <edge from-layer="1435" from-port="2" to-layer="1576" to-port="0" /> <edge from-layer="1435" from-port="2" to-layer="1436" to-port="0" /> <edge from-layer="1436" from-port="2" to-layer="1437" to-port="0" /> <edge from-layer="1437" from-port="2" to-layer="1439" to-port="0" /> <edge from-layer="1438" from-port="0" to-layer="1439" to-port="1" /> <edge from-layer="1439" from-port="2" to-layer="1461" to-port="1" /> <edge from-layer="1440" from-port="1" to-layer="1442" to-port="0" /> <edge from-layer="1441" from-port="0" to-layer="1442" to-port="2" /> <edge from-layer="1442" from-port="3" to-layer="1456" to-port="0" /> <edge from-layer="1443" from-port="0" to-layer="1444" to-port="0" /> <edge from-layer="1444" from-port="1" to-layer="1447" to-port="0" /> <edge from-layer="1445" from-port="0" to-layer="1446" to-port="0" /> <edge from-layer="1446" from-port="1" to-layer="1447" to-port="1" /> <edge from-layer="1447" from-port="2" to-layer="1449" to-port="0" /> <edge from-layer="1448" from-port="0" to-layer="1449" to-port="1" /> <edge from-layer="1449" from-port="2" to-layer="1450" to-port="0" /> <edge from-layer="1450" from-port="1" to-layer="1451" to-port="1" /> <edge from-layer="1451" from-port="2" to-layer="1453" to-port="0" /> <edge from-layer="1452" from-port="0" to-layer="1453" to-port="1" /> <edge from-layer="1453" from-port="2" to-layer="1455" to-port="0" /> <edge from-layer="1454" from-port="0" to-layer="1455" to-port="1" /> <edge from-layer="1455" from-port="2" to-layer="1456" to-port="1" /> <edge from-layer="1456" from-port="2" to-layer="1457" to-port="0" /> <edge from-layer="1456" from-port="2" to-layer="1575" to-port="0" /> <edge from-layer="1457" from-port="2" to-layer="1458" to-port="0" /> <edge from-layer="1458" from-port="2" to-layer="1460" to-port="0" /> <edge from-layer="1459" from-port="0" to-layer="1460" to-port="1" /> <edge from-layer="1460" from-port="2" to-layer="1461" to-port="2" /> <edge from-layer="1461" from-port="4" to-layer="1463" to-port="0" /> <edge from-layer="1462" from-port="0" to-layer="1463" to-port="1" /> <edge from-layer="1463" from-port="2" to-layer="1464" to-port="0" /> <edge from-layer="1464" from-port="2" to-layer="1473" to-port="0" /> <edge from-layer="1465" from-port="0" to-layer="1466" to-port="0" /> <edge from-layer="1466" from-port="1" to-layer="1469" to-port="0" /> <edge from-layer="1467" from-port="0" to-layer="1468" to-port="0" /> <edge from-layer="1468" from-port="1" to-layer="1469" to-port="1" /> <edge from-layer="1469" from-port="2" to-layer="1471" to-port="0" /> <edge from-layer="1470" from-port="0" to-layer="1471" to-port="1" /> <edge from-layer="1471" from-port="2" to-layer="1472" to-port="0" /> <edge from-layer="1472" from-port="1" to-layer="1473" to-port="1" /> <edge from-layer="1473" from-port="2" to-layer="1474" to-port="1" /> <edge from-layer="1474" from-port="2" to-layer="1478" to-port="0" /> <edge from-layer="1474" from-port="2" to-layer="1516" to-port="0" /> <edge from-layer="1474" from-port="2" to-layer="1485" to-port="0" /> <edge from-layer="1475" from-port="0" to-layer="1486" to-port="0" /> <edge from-layer="1476" from-port="0" to-layer="1484" to-port="0" /> <edge from-layer="1477" from-port="0" to-layer="1478" to-port="1" /> <edge from-layer="1478" from-port="2" to-layer="1480" to-port="0" /> <edge from-layer="1479" from-port="0" to-layer="1480" to-port="1" /> <edge from-layer="1480" from-port="2" to-layer="1482" to-port="0" /> <edge from-layer="1481" from-port="0" to-layer="1482" to-port="1" /> <edge from-layer="1482" from-port="2" to-layer="1483" to-port="0" /> <edge from-layer="1483" from-port="1" to-layer="1484" to-port="1" /> <edge from-layer="1484" from-port="2" to-layer="1485" to-port="1" /> <edge from-layer="1485" from-port="2" to-layer="1486" to-port="1" /> <edge from-layer="1486" from-port="2" to-layer="1495" to-port="0" /> <edge from-layer="1486" from-port="2" to-layer="1505" to-port="0" /> <edge from-layer="1487" from-port="0" to-layer="1488" to-port="0" /> <edge from-layer="1488" from-port="1" to-layer="1491" to-port="0" /> <edge from-layer="1489" from-port="0" to-layer="1490" to-port="0" /> <edge from-layer="1490" from-port="1" to-layer="1491" to-port="1" /> <edge from-layer="1491" from-port="2" to-layer="1493" to-port="0" /> <edge from-layer="1492" from-port="0" to-layer="1493" to-port="1" /> <edge from-layer="1493" from-port="2" to-layer="1494" to-port="0" /> <edge from-layer="1494" from-port="1" to-layer="1495" to-port="1" /> <edge from-layer="1495" from-port="2" to-layer="1496" to-port="0" /> <edge from-layer="1496" from-port="1" to-layer="1506" to-port="0" /> <edge from-layer="1497" from-port="0" to-layer="1498" to-port="0" /> <edge from-layer="1498" from-port="1" to-layer="1501" to-port="0" /> <edge from-layer="1499" from-port="0" to-layer="1500" to-port="0" /> <edge from-layer="1500" from-port="1" to-layer="1501" to-port="1" /> <edge from-layer="1501" from-port="2" to-layer="1503" to-port="0" /> <edge from-layer="1502" from-port="0" to-layer="1503" to-port="1" /> <edge from-layer="1503" from-port="2" to-layer="1504" to-port="0" /> <edge from-layer="1504" from-port="1" to-layer="1505" to-port="1" /> <edge from-layer="1505" from-port="2" to-layer="1506" to-port="1" /> <edge from-layer="1506" from-port="2" to-layer="1515" to-port="0" /> <edge from-layer="1507" from-port="0" to-layer="1508" to-port="0" /> <edge from-layer="1508" from-port="1" to-layer="1511" to-port="0" /> <edge from-layer="1509" from-port="0" to-layer="1510" to-port="0" /> <edge from-layer="1510" from-port="1" to-layer="1511" to-port="1" /> <edge from-layer="1511" from-port="2" to-layer="1513" to-port="0" /> <edge from-layer="1512" from-port="0" to-layer="1513" to-port="1" /> <edge from-layer="1513" from-port="2" to-layer="1514" to-port="0" /> <edge from-layer="1514" from-port="1" to-layer="1515" to-port="1" /> <edge from-layer="1515" from-port="2" to-layer="1516" to-port="1" /> <edge from-layer="1516" from-port="2" to-layer="1519" to-port="0" /> <edge from-layer="1516" from-port="2" to-layer="1637" to-port="0" /> <edge from-layer="1516" from-port="2" to-layer="1526" to-port="0" /> <edge from-layer="1517" from-port="0" to-layer="1525" to-port="0" /> <edge from-layer="1518" from-port="0" to-layer="1519" to-port="1" /> <edge from-layer="1519" from-port="2" to-layer="1521" to-port="0" /> <edge from-layer="1520" from-port="0" to-layer="1521" to-port="1" /> <edge from-layer="1521" from-port="2" to-layer="1523" to-port="0" /> <edge from-layer="1522" from-port="0" to-layer="1523" to-port="1" /> <edge from-layer="1523" from-port="2" to-layer="1524" to-port="0" /> <edge from-layer="1524" from-port="1" to-layer="1525" to-port="1" /> <edge from-layer="1525" from-port="2" to-layer="1526" to-port="1" /> <edge from-layer="1526" from-port="2" to-layer="1527" to-port="1" /> <edge from-layer="1527" from-port="2" to-layer="1597" to-port="0" /> <edge from-layer="1527" from-port="2" to-layer="1554" to-port="0" /> <edge from-layer="1527" from-port="2" to-layer="1536" to-port="0" /> <edge from-layer="1528" from-port="0" to-layer="1529" to-port="0" /> <edge from-layer="1529" from-port="1" to-layer="1532" to-port="0" /> <edge from-layer="1530" from-port="0" to-layer="1531" to-port="0" /> <edge from-layer="1531" from-port="1" to-layer="1532" to-port="1" /> <edge from-layer="1532" from-port="2" to-layer="1534" to-port="0" /> <edge from-layer="1533" from-port="0" to-layer="1534" to-port="1" /> <edge from-layer="1534" from-port="2" to-layer="1535" to-port="0" /> <edge from-layer="1535" from-port="1" to-layer="1536" to-port="1" /> <edge from-layer="1536" from-port="2" to-layer="1538" to-port="0" /> <edge from-layer="1537" from-port="0" to-layer="1538" to-port="1" /> <edge from-layer="1538" from-port="2" to-layer="1540" to-port="0" /> <edge from-layer="1539" from-port="0" to-layer="1540" to-port="1" /> <edge from-layer="1540" from-port="2" to-layer="1541" to-port="1" /> <edge from-layer="1541" from-port="2" to-layer="1542" to-port="0" /> <edge from-layer="1541" from-port="2" to-layer="1620" to-port="0" /> <edge from-layer="1543" from-port="1" to-layer="1545" to-port="0" /> <edge from-layer="1544" from-port="0" to-layer="1545" to-port="2" /> <edge from-layer="1545" from-port="3" to-layer="1573" to-port="0" /> <edge from-layer="1546" from-port="0" to-layer="1547" to-port="0" /> <edge from-layer="1547" from-port="1" to-layer="1550" to-port="0" /> <edge from-layer="1548" from-port="0" to-layer="1549" to-port="0" /> <edge from-layer="1549" from-port="1" to-layer="1550" to-port="1" /> <edge from-layer="1550" from-port="2" to-layer="1552" to-port="0" /> <edge from-layer="1551" from-port="0" to-layer="1552" to-port="1" /> <edge from-layer="1552" from-port="2" to-layer="1553" to-port="0" /> <edge from-layer="1553" from-port="1" to-layer="1554" to-port="1" /> <edge from-layer="1554" from-port="2" to-layer="1556" to-port="0" /> <edge from-layer="1555" from-port="0" to-layer="1556" to-port="1" /> <edge from-layer="1556" from-port="2" to-layer="1558" to-port="0" /> <edge from-layer="1557" from-port="0" to-layer="1558" to-port="1" /> <edge from-layer="1558" from-port="2" to-layer="1569" to-port="0" /> <edge from-layer="1558" from-port="2" to-layer="1559" to-port="0" /> <edge from-layer="1558" from-port="2" to-layer="1563" to-port="0" /> <edge from-layer="1559" from-port="2" to-layer="1572" to-port="0" /> <edge from-layer="1560" from-port="0" to-layer="1563" to-port="1" /> <edge from-layer="1561" from-port="0" to-layer="1563" to-port="2" /> <edge from-layer="1562" from-port="0" to-layer="1563" to-port="3" /> <edge from-layer="1563" from-port="5" to-layer="1565" to-port="0" /> <edge from-layer="1564" from-port="0" to-layer="1565" to-port="1" /> <edge from-layer="1565" from-port="2" to-layer="1570" to-port="0" /> <edge from-layer="1566" from-port="0" to-layer="1569" to-port="1" /> <edge from-layer="1567" from-port="0" to-layer="1569" to-port="2" /> <edge from-layer="1568" from-port="0" to-layer="1569" to-port="3" /> <edge from-layer="1569" from-port="5" to-layer="1570" to-port="1" /> <edge from-layer="1570" from-port="2" to-layer="1571" to-port="0" /> <edge from-layer="1571" from-port="2" to-layer="1572" to-port="1" /> <edge from-layer="1572" from-port="2" to-layer="1573" to-port="1" /> <edge from-layer="1573" from-port="2" to-layer="1616" to-port="0" /> <edge from-layer="1573" from-port="2" to-layer="1574" to-port="0" /> <edge from-layer="1585" from-port="1" to-layer="1587" to-port="0" /> <edge from-layer="1586" from-port="0" to-layer="1587" to-port="2" /> <edge from-layer="1587" from-port="3" to-layer="6083" to-port="0" /> <edge from-layer="1588" from-port="0" to-layer="6069" to-port="0" /> <edge from-layer="1589" from-port="0" to-layer="1590" to-port="0" /> <edge from-layer="1590" from-port="1" to-layer="1593" to-port="0" /> <edge from-layer="1591" from-port="0" to-layer="1592" to-port="0" /> <edge from-layer="1592" from-port="1" to-layer="1593" to-port="1" /> <edge from-layer="1593" from-port="2" to-layer="1595" to-port="0" /> <edge from-layer="1594" from-port="0" to-layer="1595" to-port="1" /> <edge from-layer="1595" from-port="2" to-layer="1596" to-port="0" /> <edge from-layer="1596" from-port="1" to-layer="1597" to-port="1" /> <edge from-layer="1597" from-port="2" to-layer="1599" to-port="0" /> <edge from-layer="1598" from-port="0" to-layer="1599" to-port="1" /> <edge from-layer="1599" from-port="2" to-layer="1601" to-port="0" /> <edge from-layer="1600" from-port="0" to-layer="1601" to-port="1" /> <edge from-layer="1601" from-port="2" to-layer="1602" to-port="0" /> <edge from-layer="1601" from-port="2" to-layer="1606" to-port="0" /> <edge from-layer="1601" from-port="2" to-layer="1612" to-port="0" /> <edge from-layer="1602" from-port="2" to-layer="1615" to-port="0" /> <edge from-layer="1603" from-port="0" to-layer="1606" to-port="1" /> <edge from-layer="1604" from-port="0" to-layer="1606" to-port="2" /> <edge from-layer="1605" from-port="0" to-layer="1606" to-port="3" /> <edge from-layer="1606" from-port="5" to-layer="1608" to-port="0" /> <edge from-layer="1607" from-port="0" to-layer="1608" to-port="1" /> <edge from-layer="1608" from-port="2" to-layer="1613" to-port="0" /> <edge from-layer="1609" from-port="0" to-layer="1612" to-port="1" /> <edge from-layer="1610" from-port="0" to-layer="1612" to-port="2" /> <edge from-layer="1611" from-port="0" to-layer="1612" to-port="3" /> <edge from-layer="1612" from-port="5" to-layer="1613" to-port="1" /> <edge from-layer="1613" from-port="2" to-layer="1614" to-port="0" /> <edge from-layer="1614" from-port="2" to-layer="1615" to-port="1" /> <edge from-layer="1615" from-port="2" to-layer="1624" to-port="0" /> <edge from-layer="1616" from-port="2" to-layer="1617" to-port="0" /> <edge from-layer="1617" from-port="2" to-layer="1619" to-port="0" /> <edge from-layer="1618" from-port="0" to-layer="1619" to-port="1" /> <edge from-layer="1619" from-port="2" to-layer="1624" to-port="1" /> <edge from-layer="1620" from-port="2" to-layer="1621" to-port="0" /> <edge from-layer="1621" from-port="2" to-layer="1623" to-port="0" /> <edge from-layer="1622" from-port="0" to-layer="1623" to-port="1" /> <edge from-layer="1623" from-port="2" to-layer="1624" to-port="2" /> <edge from-layer="1624" from-port="4" to-layer="1626" to-port="0" /> <edge from-layer="1625" from-port="0" to-layer="1626" to-port="1" /> <edge from-layer="1626" from-port="2" to-layer="1627" to-port="0" /> <edge from-layer="1627" from-port="2" to-layer="1636" to-port="0" /> <edge from-layer="1628" from-port="0" to-layer="1629" to-port="0" /> <edge from-layer="1629" from-port="1" to-layer="1632" to-port="0" /> <edge from-layer="1630" from-port="0" to-layer="1631" to-port="0" /> <edge from-layer="1631" from-port="1" to-layer="1632" to-port="1" /> <edge from-layer="1632" from-port="2" to-layer="1634" to-port="0" /> <edge from-layer="1633" from-port="0" to-layer="1634" to-port="1" /> <edge from-layer="1634" from-port="2" to-layer="1635" to-port="0" /> <edge from-layer="1635" from-port="1" to-layer="1636" to-port="1" /> <edge from-layer="1636" from-port="2" to-layer="1637" to-port="1" /> <edge from-layer="1637" from-port="2" to-layer="1641" to-port="0" /> <edge from-layer="1637" from-port="2" to-layer="1679" to-port="0" /> <edge from-layer="1637" from-port="2" to-layer="1648" to-port="0" /> <edge from-layer="1638" from-port="0" to-layer="1649" to-port="0" /> <edge from-layer="1639" from-port="0" to-layer="1647" to-port="0" /> <edge from-layer="1640" from-port="0" to-layer="1641" to-port="1" /> <edge from-layer="1641" from-port="2" to-layer="1643" to-port="0" /> <edge from-layer="1642" from-port="0" to-layer="1643" to-port="1" /> <edge from-layer="1643" from-port="2" to-layer="1645" to-port="0" /> <edge from-layer="1644" from-port="0" to-layer="1645" to-port="1" /> <edge from-layer="1645" from-port="2" to-layer="1646" to-port="0" /> <edge from-layer="1646" from-port="1" to-layer="1647" to-port="1" /> <edge from-layer="1647" from-port="2" to-layer="1648" to-port="1" /> <edge from-layer="1648" from-port="2" to-layer="1649" to-port="1" /> <edge from-layer="1649" from-port="2" to-layer="1668" to-port="0" /> <edge from-layer="1649" from-port="2" to-layer="1658" to-port="0" /> <edge from-layer="1650" from-port="0" to-layer="1651" to-port="0" /> <edge from-layer="1651" from-port="1" to-layer="1654" to-port="0" /> <edge from-layer="1652" from-port="0" to-layer="1653" to-port="0" /> <edge from-layer="1653" from-port="1" to-layer="1654" to-port="1" /> <edge from-layer="1654" from-port="2" to-layer="1656" to-port="0" /> <edge from-layer="1655" from-port="0" to-layer="1656" to-port="1" /> <edge from-layer="1656" from-port="2" to-layer="1657" to-port="0" /> <edge from-layer="1657" from-port="1" to-layer="1658" to-port="1" /> <edge from-layer="1658" from-port="2" to-layer="1659" to-port="0" /> <edge from-layer="1659" from-port="1" to-layer="1669" to-port="0" /> <edge from-layer="1660" from-port="0" to-layer="1661" to-port="0" /> <edge from-layer="1661" from-port="1" to-layer="1664" to-port="0" /> <edge from-layer="1662" from-port="0" to-layer="1663" to-port="0" /> <edge from-layer="1663" from-port="1" to-layer="1664" to-port="1" /> <edge from-layer="1664" from-port="2" to-layer="1666" to-port="0" /> <edge from-layer="1665" from-port="0" to-layer="1666" to-port="1" /> <edge from-layer="1666" from-port="2" to-layer="1667" to-port="0" /> <edge from-layer="1667" from-port="1" to-layer="1668" to-port="1" /> <edge from-layer="1668" from-port="2" to-layer="1669" to-port="1" /> <edge from-layer="1669" from-port="2" to-layer="1678" to-port="0" /> <edge from-layer="1670" from-port="0" to-layer="1671" to-port="0" /> <edge from-layer="1671" from-port="1" to-layer="1674" to-port="0" /> <edge from-layer="1672" from-port="0" to-layer="1673" to-port="0" /> <edge from-layer="1673" from-port="1" to-layer="1674" to-port="1" /> <edge from-layer="1674" from-port="2" to-layer="1676" to-port="0" /> <edge from-layer="1675" from-port="0" to-layer="1676" to-port="1" /> <edge from-layer="1676" from-port="2" to-layer="1677" to-port="0" /> <edge from-layer="1677" from-port="1" to-layer="1678" to-port="1" /> <edge from-layer="1678" from-port="2" to-layer="1679" to-port="1" /> <edge from-layer="1679" from-port="2" to-layer="1683" to-port="0" /> <edge from-layer="1679" from-port="2" to-layer="1690" to-port="0" /> <edge from-layer="1679" from-port="2" to-layer="1788" to-port="0" /> <edge from-layer="1680" from-port="0" to-layer="1691" to-port="0" /> <edge from-layer="1681" from-port="0" to-layer="1689" to-port="0" /> <edge from-layer="1682" from-port="0" to-layer="1683" to-port="1" /> <edge from-layer="1683" from-port="2" to-layer="1685" to-port="0" /> <edge from-layer="1684" from-port="0" to-layer="1685" to-port="1" /> <edge from-layer="1685" from-port="2" to-layer="1687" to-port="0" /> <edge from-layer="1686" from-port="0" to-layer="1687" to-port="1" /> <edge from-layer="1687" from-port="2" to-layer="1688" to-port="0" /> <edge from-layer="1688" from-port="1" to-layer="1689" to-port="1" /> <edge from-layer="1689" from-port="2" to-layer="1690" to-port="1" /> <edge from-layer="1690" from-port="2" to-layer="1691" to-port="1" /> <edge from-layer="1691" from-port="2" to-layer="1765" to-port="0" /> <edge from-layer="1691" from-port="2" to-layer="1730" to-port="0" /> <edge from-layer="1691" from-port="2" to-layer="1700" to-port="0" /> <edge from-layer="1692" from-port="0" to-layer="1693" to-port="0" /> <edge from-layer="1693" from-port="1" to-layer="1696" to-port="0" /> <edge from-layer="1694" from-port="0" to-layer="1695" to-port="0" /> <edge from-layer="1695" from-port="1" to-layer="1696" to-port="1" /> <edge from-layer="1696" from-port="2" to-layer="1698" to-port="0" /> <edge from-layer="1697" from-port="0" to-layer="1698" to-port="1" /> <edge from-layer="1698" from-port="2" to-layer="1699" to-port="0" /> <edge from-layer="1699" from-port="1" to-layer="1700" to-port="1" /> <edge from-layer="1700" from-port="2" to-layer="1702" to-port="0" /> <edge from-layer="1701" from-port="0" to-layer="1702" to-port="1" /> <edge from-layer="1702" from-port="2" to-layer="1704" to-port="0" /> <edge from-layer="1703" from-port="0" to-layer="1704" to-port="1" /> <edge from-layer="1704" from-port="2" to-layer="1705" to-port="0" /> <edge from-layer="1704" from-port="2" to-layer="1709" to-port="0" /> <edge from-layer="1704" from-port="2" to-layer="1715" to-port="0" /> <edge from-layer="1705" from-port="2" to-layer="1718" to-port="0" /> <edge from-layer="1706" from-port="0" to-layer="1709" to-port="1" /> <edge from-layer="1707" from-port="0" to-layer="1709" to-port="2" /> <edge from-layer="1708" from-port="0" to-layer="1709" to-port="3" /> <edge from-layer="1709" from-port="5" to-layer="1711" to-port="0" /> <edge from-layer="1710" from-port="0" to-layer="1711" to-port="1" /> <edge from-layer="1711" from-port="2" to-layer="1716" to-port="0" /> <edge from-layer="1712" from-port="0" to-layer="1715" to-port="1" /> <edge from-layer="1713" from-port="0" to-layer="1715" to-port="2" /> <edge from-layer="1714" from-port="0" to-layer="1715" to-port="3" /> <edge from-layer="1715" from-port="5" to-layer="1716" to-port="1" /> <edge from-layer="1716" from-port="2" to-layer="1717" to-port="0" /> <edge from-layer="1717" from-port="2" to-layer="1718" to-port="1" /> <edge from-layer="1718" from-port="2" to-layer="1775" to-port="0" /> <edge from-layer="1719" from-port="1" to-layer="1721" to-port="0" /> <edge from-layer="1720" from-port="0" to-layer="1721" to-port="2" /> <edge from-layer="1721" from-port="3" to-layer="1749" to-port="0" /> <edge from-layer="1722" from-port="0" to-layer="1723" to-port="0" /> <edge from-layer="1723" from-port="1" to-layer="1726" to-port="0" /> <edge from-layer="1724" from-port="0" to-layer="1725" to-port="0" /> <edge from-layer="1725" from-port="1" to-layer="1726" to-port="1" /> <edge from-layer="1726" from-port="2" to-layer="1728" to-port="0" /> <edge from-layer="1727" from-port="0" to-layer="1728" to-port="1" /> <edge from-layer="1728" from-port="2" to-layer="1729" to-port="0" /> <edge from-layer="1729" from-port="1" to-layer="1730" to-port="1" /> <edge from-layer="1730" from-port="2" to-layer="1732" to-port="0" /> <edge from-layer="1731" from-port="0" to-layer="1732" to-port="1" /> <edge from-layer="1732" from-port="2" to-layer="1734" to-port="0" /> <edge from-layer="1733" from-port="0" to-layer="1734" to-port="1" /> <edge from-layer="1734" from-port="2" to-layer="1745" to-port="0" /> <edge from-layer="1734" from-port="2" to-layer="1739" to-port="0" /> <edge from-layer="1734" from-port="2" to-layer="1735" to-port="0" /> <edge from-layer="1735" from-port="2" to-layer="1748" to-port="0" /> <edge from-layer="1736" from-port="0" to-layer="1739" to-port="1" /> <edge from-layer="1737" from-port="0" to-layer="1739" to-port="2" /> <edge from-layer="1738" from-port="0" to-layer="1739" to-port="3" /> <edge from-layer="1739" from-port="5" to-layer="1741" to-port="0" /> <edge from-layer="1740" from-port="0" to-layer="1741" to-port="1" /> <edge from-layer="1741" from-port="2" to-layer="1746" to-port="0" /> <edge from-layer="1742" from-port="0" to-layer="1745" to-port="1" /> <edge from-layer="1743" from-port="0" to-layer="1745" to-port="2" /> <edge from-layer="1744" from-port="0" to-layer="1745" to-port="3" /> <edge from-layer="1745" from-port="5" to-layer="1746" to-port="1" /> <edge from-layer="1746" from-port="2" to-layer="1747" to-port="0" /> <edge from-layer="1747" from-port="2" to-layer="1748" to-port="1" /> <edge from-layer="1748" from-port="2" to-layer="1749" to-port="1" /> <edge from-layer="1749" from-port="2" to-layer="1750" to-port="0" /> <edge from-layer="1749" from-port="2" to-layer="6178" to-port="0" /> <edge from-layer="1750" from-port="2" to-layer="1751" to-port="0" /> <edge from-layer="1751" from-port="2" to-layer="1753" to-port="0" /> <edge from-layer="1752" from-port="0" to-layer="1753" to-port="1" /> <edge from-layer="1753" from-port="2" to-layer="1775" to-port="1" /> <edge from-layer="1754" from-port="1" to-layer="1756" to-port="0" /> <edge from-layer="1755" from-port="0" to-layer="1756" to-port="2" /> <edge from-layer="1756" from-port="3" to-layer="1770" to-port="0" /> <edge from-layer="1757" from-port="0" to-layer="1758" to-port="0" /> <edge from-layer="1758" from-port="1" to-layer="1761" to-port="0" /> <edge from-layer="1759" from-port="0" to-layer="1760" to-port="0" /> <edge from-layer="1760" from-port="1" to-layer="1761" to-port="1" /> <edge from-layer="1761" from-port="2" to-layer="1763" to-port="0" /> <edge from-layer="1762" from-port="0" to-layer="1763" to-port="1" /> <edge from-layer="1763" from-port="2" to-layer="1764" to-port="0" /> <edge from-layer="1764" from-port="1" to-layer="1765" to-port="1" /> <edge from-layer="1765" from-port="2" to-layer="1767" to-port="0" /> <edge from-layer="1766" from-port="0" to-layer="1767" to-port="1" /> <edge from-layer="1767" from-port="2" to-layer="1769" to-port="0" /> <edge from-layer="1768" from-port="0" to-layer="1769" to-port="1" /> <edge from-layer="1769" from-port="2" to-layer="1770" to-port="1" /> <edge from-layer="1770" from-port="2" to-layer="1771" to-port="0" /> <edge from-layer="1770" from-port="2" to-layer="6177" to-port="0" /> <edge from-layer="1771" from-port="2" to-layer="1772" to-port="0" /> <edge from-layer="1772" from-port="2" to-layer="1774" to-port="0" /> <edge from-layer="1773" from-port="0" to-layer="1774" to-port="1" /> <edge from-layer="1774" from-port="2" to-layer="1775" to-port="2" /> <edge from-layer="1775" from-port="4" to-layer="1777" to-port="0" /> <edge from-layer="1776" from-port="0" to-layer="1777" to-port="1" /> <edge from-layer="1777" from-port="2" to-layer="1778" to-port="0" /> <edge from-layer="1778" from-port="2" to-layer="1787" to-port="0" /> <edge from-layer="1779" from-port="0" to-layer="1780" to-port="0" /> <edge from-layer="1780" from-port="1" to-layer="1783" to-port="0" /> <edge from-layer="1781" from-port="0" to-layer="1782" to-port="0" /> <edge from-layer="1782" from-port="1" to-layer="1783" to-port="1" /> <edge from-layer="1783" from-port="2" to-layer="1785" to-port="0" /> <edge from-layer="1784" from-port="0" to-layer="1785" to-port="1" /> <edge from-layer="1785" from-port="2" to-layer="1786" to-port="0" /> <edge from-layer="1786" from-port="1" to-layer="1787" to-port="1" /> <edge from-layer="1787" from-port="2" to-layer="1788" to-port="1" /> <edge from-layer="1788" from-port="2" to-layer="1830" to-port="0" /> <edge from-layer="1788" from-port="2" to-layer="1792" to-port="0" /> <edge from-layer="1788" from-port="2" to-layer="1799" to-port="0" /> <edge from-layer="1789" from-port="0" to-layer="1800" to-port="0" /> <edge from-layer="1790" from-port="0" to-layer="1798" to-port="0" /> <edge from-layer="1791" from-port="0" to-layer="1792" to-port="1" /> <edge from-layer="1792" from-port="2" to-layer="1794" to-port="0" /> <edge from-layer="1793" from-port="0" to-layer="1794" to-port="1" /> <edge from-layer="1794" from-port="2" to-layer="1796" to-port="0" /> <edge from-layer="1795" from-port="0" to-layer="1796" to-port="1" /> <edge from-layer="1796" from-port="2" to-layer="1797" to-port="0" /> <edge from-layer="1797" from-port="1" to-layer="1798" to-port="1" /> <edge from-layer="1798" from-port="2" to-layer="1799" to-port="1" /> <edge from-layer="1799" from-port="2" to-layer="1800" to-port="1" /> <edge from-layer="1800" from-port="2" to-layer="1809" to-port="0" /> <edge from-layer="1800" from-port="2" to-layer="1819" to-port="0" /> <edge from-layer="1801" from-port="0" to-layer="1802" to-port="0" /> <edge from-layer="1802" from-port="1" to-layer="1805" to-port="0" /> <edge from-layer="1803" from-port="0" to-layer="1804" to-port="0" /> <edge from-layer="1804" from-port="1" to-layer="1805" to-port="1" /> <edge from-layer="1805" from-port="2" to-layer="1807" to-port="0" /> <edge from-layer="1806" from-port="0" to-layer="1807" to-port="1" /> <edge from-layer="1807" from-port="2" to-layer="1808" to-port="0" /> <edge from-layer="1808" from-port="1" to-layer="1809" to-port="1" /> <edge from-layer="1809" from-port="2" to-layer="1810" to-port="0" /> <edge from-layer="1810" from-port="1" to-layer="1820" to-port="0" /> <edge from-layer="1811" from-port="0" to-layer="1812" to-port="0" /> <edge from-layer="1812" from-port="1" to-layer="1815" to-port="0" /> <edge from-layer="1813" from-port="0" to-layer="1814" to-port="0" /> <edge from-layer="1814" from-port="1" to-layer="1815" to-port="1" /> <edge from-layer="1815" from-port="2" to-layer="1817" to-port="0" /> <edge from-layer="1816" from-port="0" to-layer="1817" to-port="1" /> <edge from-layer="1817" from-port="2" to-layer="1818" to-port="0" /> <edge from-layer="1818" from-port="1" to-layer="1819" to-port="1" /> <edge from-layer="1819" from-port="2" to-layer="1820" to-port="1" /> <edge from-layer="1820" from-port="2" to-layer="1829" to-port="0" /> <edge from-layer="1821" from-port="0" to-layer="1822" to-port="0" /> <edge from-layer="1822" from-port="1" to-layer="1825" to-port="0" /> <edge from-layer="1823" from-port="0" to-layer="1824" to-port="0" /> <edge from-layer="1824" from-port="1" to-layer="1825" to-port="1" /> <edge from-layer="1825" from-port="2" to-layer="1827" to-port="0" /> <edge from-layer="1826" from-port="0" to-layer="1827" to-port="1" /> <edge from-layer="1827" from-port="2" to-layer="1828" to-port="0" /> <edge from-layer="1828" from-port="1" to-layer="1829" to-port="1" /> <edge from-layer="1829" from-port="2" to-layer="1830" to-port="1" /> <edge from-layer="1830" from-port="2" to-layer="1939" to-port="0" /> <edge from-layer="1830" from-port="2" to-layer="1841" to-port="0" /> <edge from-layer="1830" from-port="2" to-layer="1834" to-port="0" /> <edge from-layer="1831" from-port="0" to-layer="1842" to-port="0" /> <edge from-layer="1832" from-port="0" to-layer="1840" to-port="0" /> <edge from-layer="1833" from-port="0" to-layer="1834" to-port="1" /> <edge from-layer="1834" from-port="2" to-layer="1836" to-port="0" /> <edge from-layer="1835" from-port="0" to-layer="1836" to-port="1" /> <edge from-layer="1836" from-port="2" to-layer="1838" to-port="0" /> <edge from-layer="1837" from-port="0" to-layer="1838" to-port="1" /> <edge from-layer="1838" from-port="2" to-layer="1839" to-port="0" /> <edge from-layer="1839" from-port="1" to-layer="1840" to-port="1" /> <edge from-layer="1840" from-port="2" to-layer="1841" to-port="1" /> <edge from-layer="1841" from-port="2" to-layer="1842" to-port="1" /> <edge from-layer="1842" from-port="2" to-layer="1881" to-port="0" /> <edge from-layer="1842" from-port="2" to-layer="1916" to-port="0" /> <edge from-layer="1842" from-port="2" to-layer="1851" to-port="0" /> <edge from-layer="1843" from-port="0" to-layer="1844" to-port="0" /> <edge from-layer="1844" from-port="1" to-layer="1847" to-port="0" /> <edge from-layer="1845" from-port="0" to-layer="1846" to-port="0" /> <edge from-layer="1846" from-port="1" to-layer="1847" to-port="1" /> <edge from-layer="1847" from-port="2" to-layer="1849" to-port="0" /> <edge from-layer="1848" from-port="0" to-layer="1849" to-port="1" /> <edge from-layer="1849" from-port="2" to-layer="1850" to-port="0" /> <edge from-layer="1850" from-port="1" to-layer="1851" to-port="1" /> <edge from-layer="1851" from-port="2" to-layer="1853" to-port="0" /> <edge from-layer="1852" from-port="0" to-layer="1853" to-port="1" /> <edge from-layer="1853" from-port="2" to-layer="1855" to-port="0" /> <edge from-layer="1854" from-port="0" to-layer="1855" to-port="1" /> <edge from-layer="1855" from-port="2" to-layer="1860" to-port="0" /> <edge from-layer="1855" from-port="2" to-layer="1866" to-port="0" /> <edge from-layer="1855" from-port="2" to-layer="1856" to-port="0" /> <edge from-layer="1856" from-port="2" to-layer="1869" to-port="0" /> <edge from-layer="1857" from-port="0" to-layer="1860" to-port="1" /> <edge from-layer="1858" from-port="0" to-layer="1860" to-port="2" /> <edge from-layer="1859" from-port="0" to-layer="1860" to-port="3" /> <edge from-layer="1860" from-port="5" to-layer="1862" to-port="0" /> <edge from-layer="1861" from-port="0" to-layer="1862" to-port="1" /> <edge from-layer="1862" from-port="2" to-layer="1867" to-port="0" /> <edge from-layer="1863" from-port="0" to-layer="1866" to-port="1" /> <edge from-layer="1864" from-port="0" to-layer="1866" to-port="2" /> <edge from-layer="1865" from-port="0" to-layer="1866" to-port="3" /> <edge from-layer="1866" from-port="5" to-layer="1867" to-port="1" /> <edge from-layer="1867" from-port="2" to-layer="1868" to-port="0" /> <edge from-layer="1868" from-port="2" to-layer="1869" to-port="1" /> <edge from-layer="1869" from-port="2" to-layer="1926" to-port="0" /> <edge from-layer="1870" from-port="1" to-layer="1872" to-port="0" /> <edge from-layer="1871" from-port="0" to-layer="1872" to-port="2" /> <edge from-layer="1872" from-port="3" to-layer="1900" to-port="0" /> <edge from-layer="1873" from-port="0" to-layer="1874" to-port="0" /> <edge from-layer="1874" from-port="1" to-layer="1877" to-port="0" /> <edge from-layer="1875" from-port="0" to-layer="1876" to-port="0" /> <edge from-layer="1876" from-port="1" to-layer="1877" to-port="1" /> <edge from-layer="1877" from-port="2" to-layer="1879" to-port="0" /> <edge from-layer="1878" from-port="0" to-layer="1879" to-port="1" /> <edge from-layer="1879" from-port="2" to-layer="1880" to-port="0" /> <edge from-layer="1880" from-port="1" to-layer="1881" to-port="1" /> <edge from-layer="1881" from-port="2" to-layer="1883" to-port="0" /> <edge from-layer="1882" from-port="0" to-layer="1883" to-port="1" /> <edge from-layer="1883" from-port="2" to-layer="1885" to-port="0" /> <edge from-layer="1884" from-port="0" to-layer="1885" to-port="1" /> <edge from-layer="1885" from-port="2" to-layer="1886" to-port="0" /> <edge from-layer="1885" from-port="2" to-layer="1890" to-port="0" /> <edge from-layer="1885" from-port="2" to-layer="1896" to-port="0" /> <edge from-layer="1886" from-port="2" to-layer="1899" to-port="0" /> <edge from-layer="1887" from-port="0" to-layer="1890" to-port="1" /> <edge from-layer="1888" from-port="0" to-layer="1890" to-port="2" /> <edge from-layer="1889" from-port="0" to-layer="1890" to-port="3" /> <edge from-layer="1890" from-port="5" to-layer="1892" to-port="0" /> <edge from-layer="1891" from-port="0" to-layer="1892" to-port="1" /> <edge from-layer="1892" from-port="2" to-layer="1897" to-port="0" /> <edge from-layer="1893" from-port="0" to-layer="1896" to-port="1" /> <edge from-layer="1894" from-port="0" to-layer="1896" to-port="2" /> <edge from-layer="1895" from-port="0" to-layer="1896" to-port="3" /> <edge from-layer="1896" from-port="5" to-layer="1897" to-port="1" /> <edge from-layer="1897" from-port="2" to-layer="1898" to-port="0" /> <edge from-layer="1898" from-port="2" to-layer="1899" to-port="1" /> <edge from-layer="1899" from-port="2" to-layer="1900" to-port="1" /> <edge from-layer="1900" from-port="2" to-layer="6176" to-port="0" /> <edge from-layer="1900" from-port="2" to-layer="1901" to-port="0" /> <edge from-layer="1901" from-port="2" to-layer="1902" to-port="0" /> <edge from-layer="1902" from-port="2" to-layer="1904" to-port="0" /> <edge from-layer="1903" from-port="0" to-layer="1904" to-port="1" /> <edge from-layer="1904" from-port="2" to-layer="1926" to-port="1" /> <edge from-layer="1905" from-port="1" to-layer="1907" to-port="0" /> <edge from-layer="1906" from-port="0" to-layer="1907" to-port="2" /> <edge from-layer="1907" from-port="3" to-layer="1921" to-port="0" /> <edge from-layer="1908" from-port="0" to-layer="1909" to-port="0" /> <edge from-layer="1909" from-port="1" to-layer="1912" to-port="0" /> <edge from-layer="1910" from-port="0" to-layer="1911" to-port="0" /> <edge from-layer="1911" from-port="1" to-layer="1912" to-port="1" /> <edge from-layer="1912" from-port="2" to-layer="1914" to-port="0" /> <edge from-layer="1913" from-port="0" to-layer="1914" to-port="1" /> <edge from-layer="1914" from-port="2" to-layer="1915" to-port="0" /> <edge from-layer="1915" from-port="1" to-layer="1916" to-port="1" /> <edge from-layer="1916" from-port="2" to-layer="1918" to-port="0" /> <edge from-layer="1917" from-port="0" to-layer="1918" to-port="1" /> <edge from-layer="1918" from-port="2" to-layer="1920" to-port="0" /> <edge from-layer="1919" from-port="0" to-layer="1920" to-port="1" /> <edge from-layer="1920" from-port="2" to-layer="1921" to-port="1" /> <edge from-layer="1921" from-port="2" to-layer="6175" to-port="0" /> <edge from-layer="1921" from-port="2" to-layer="1922" to-port="0" /> <edge from-layer="1922" from-port="2" to-layer="1923" to-port="0" /> <edge from-layer="1923" from-port="2" to-layer="1925" to-port="0" /> <edge from-layer="1924" from-port="0" to-layer="1925" to-port="1" /> <edge from-layer="1925" from-port="2" to-layer="1926" to-port="2" /> <edge from-layer="1926" from-port="4" to-layer="1928" to-port="0" /> <edge from-layer="1927" from-port="0" to-layer="1928" to-port="1" /> <edge from-layer="1928" from-port="2" to-layer="1929" to-port="0" /> <edge from-layer="1929" from-port="2" to-layer="1938" to-port="0" /> <edge from-layer="1930" from-port="0" to-layer="1931" to-port="0" /> <edge from-layer="1931" from-port="1" to-layer="1934" to-port="0" /> <edge from-layer="1932" from-port="0" to-layer="1933" to-port="0" /> <edge from-layer="1933" from-port="1" to-layer="1934" to-port="1" /> <edge from-layer="1934" from-port="2" to-layer="1936" to-port="0" /> <edge from-layer="1935" from-port="0" to-layer="1936" to-port="1" /> <edge from-layer="1936" from-port="2" to-layer="1937" to-port="0" /> <edge from-layer="1937" from-port="1" to-layer="1938" to-port="1" /> <edge from-layer="1938" from-port="2" to-layer="1939" to-port="1" /> <edge from-layer="1939" from-port="2" to-layer="1943" to-port="0" /> <edge from-layer="1939" from-port="2" to-layer="1981" to-port="0" /> <edge from-layer="1939" from-port="2" to-layer="1950" to-port="0" /> <edge from-layer="1940" from-port="0" to-layer="1951" to-port="0" /> <edge from-layer="1941" from-port="0" to-layer="1949" to-port="0" /> <edge from-layer="1942" from-port="0" to-layer="1943" to-port="1" /> <edge from-layer="1943" from-port="2" to-layer="1945" to-port="0" /> <edge from-layer="1944" from-port="0" to-layer="1945" to-port="1" /> <edge from-layer="1945" from-port="2" to-layer="1947" to-port="0" /> <edge from-layer="1946" from-port="0" to-layer="1947" to-port="1" /> <edge from-layer="1947" from-port="2" to-layer="1948" to-port="0" /> <edge from-layer="1948" from-port="1" to-layer="1949" to-port="1" /> <edge from-layer="1949" from-port="2" to-layer="1950" to-port="1" /> <edge from-layer="1950" from-port="2" to-layer="1951" to-port="1" /> <edge from-layer="1951" from-port="2" to-layer="1970" to-port="0" /> <edge from-layer="1951" from-port="2" to-layer="1960" to-port="0" /> <edge from-layer="1952" from-port="0" to-layer="1953" to-port="0" /> <edge from-layer="1953" from-port="1" to-layer="1956" to-port="0" /> <edge from-layer="1954" from-port="0" to-layer="1955" to-port="0" /> <edge from-layer="1955" from-port="1" to-layer="1956" to-port="1" /> <edge from-layer="1956" from-port="2" to-layer="1958" to-port="0" /> <edge from-layer="1957" from-port="0" to-layer="1958" to-port="1" /> <edge from-layer="1958" from-port="2" to-layer="1959" to-port="0" /> <edge from-layer="1959" from-port="1" to-layer="1960" to-port="1" /> <edge from-layer="1960" from-port="2" to-layer="1961" to-port="0" /> <edge from-layer="1961" from-port="1" to-layer="1971" to-port="0" /> <edge from-layer="1962" from-port="0" to-layer="1963" to-port="0" /> <edge from-layer="1963" from-port="1" to-layer="1966" to-port="0" /> <edge from-layer="1964" from-port="0" to-layer="1965" to-port="0" /> <edge from-layer="1965" from-port="1" to-layer="1966" to-port="1" /> <edge from-layer="1966" from-port="2" to-layer="1968" to-port="0" /> <edge from-layer="1967" from-port="0" to-layer="1968" to-port="1" /> <edge from-layer="1968" from-port="2" to-layer="1969" to-port="0" /> <edge from-layer="1969" from-port="1" to-layer="1970" to-port="1" /> <edge from-layer="1970" from-port="2" to-layer="1971" to-port="1" /> <edge from-layer="1971" from-port="2" to-layer="1980" to-port="0" /> <edge from-layer="1972" from-port="0" to-layer="1973" to-port="0" /> <edge from-layer="1973" from-port="1" to-layer="1976" to-port="0" /> <edge from-layer="1974" from-port="0" to-layer="1975" to-port="0" /> <edge from-layer="1975" from-port="1" to-layer="1976" to-port="1" /> <edge from-layer="1976" from-port="2" to-layer="1978" to-port="0" /> <edge from-layer="1977" from-port="0" to-layer="1978" to-port="1" /> <edge from-layer="1978" from-port="2" to-layer="1979" to-port="0" /> <edge from-layer="1979" from-port="1" to-layer="1980" to-port="1" /> <edge from-layer="1980" from-port="2" to-layer="1981" to-port="1" /> <edge from-layer="1981" from-port="2" to-layer="1985" to-port="0" /> <edge from-layer="1981" from-port="2" to-layer="1992" to-port="0" /> <edge from-layer="1981" from-port="2" to-layer="2090" to-port="0" /> <edge from-layer="1982" from-port="0" to-layer="1993" to-port="0" /> <edge from-layer="1983" from-port="0" to-layer="1991" to-port="0" /> <edge from-layer="1984" from-port="0" to-layer="1985" to-port="1" /> <edge from-layer="1985" from-port="2" to-layer="1987" to-port="0" /> <edge from-layer="1986" from-port="0" to-layer="1987" to-port="1" /> <edge from-layer="1987" from-port="2" to-layer="1989" to-port="0" /> <edge from-layer="1988" from-port="0" to-layer="1989" to-port="1" /> <edge from-layer="1989" from-port="2" to-layer="1990" to-port="0" /> <edge from-layer="1990" from-port="1" to-layer="1991" to-port="1" /> <edge from-layer="1991" from-port="2" to-layer="1992" to-port="1" /> <edge from-layer="1992" from-port="2" to-layer="1993" to-port="1" /> <edge from-layer="1993" from-port="2" to-layer="2032" to-port="0" /> <edge from-layer="1993" from-port="2" to-layer="2067" to-port="0" /> <edge from-layer="1993" from-port="2" to-layer="2002" to-port="0" /> <edge from-layer="1994" from-port="0" to-layer="1995" to-port="0" /> <edge from-layer="1995" from-port="1" to-layer="1998" to-port="0" /> <edge from-layer="1996" from-port="0" to-layer="1997" to-port="0" /> <edge from-layer="1997" from-port="1" to-layer="1998" to-port="1" /> <edge from-layer="1998" from-port="2" to-layer="2000" to-port="0" /> <edge from-layer="1999" from-port="0" to-layer="2000" to-port="1" /> <edge from-layer="2000" from-port="2" to-layer="2001" to-port="0" /> <edge from-layer="2001" from-port="1" to-layer="2002" to-port="1" /> <edge from-layer="2002" from-port="2" to-layer="2004" to-port="0" /> <edge from-layer="2003" from-port="0" to-layer="2004" to-port="1" /> <edge from-layer="2004" from-port="2" to-layer="2006" to-port="0" /> <edge from-layer="2005" from-port="0" to-layer="2006" to-port="1" /> <edge from-layer="2006" from-port="2" to-layer="2007" to-port="0" /> <edge from-layer="2006" from-port="2" to-layer="2011" to-port="0" /> <edge from-layer="2006" from-port="2" to-layer="2017" to-port="0" /> <edge from-layer="2007" from-port="2" to-layer="2020" to-port="0" /> <edge from-layer="2008" from-port="0" to-layer="2011" to-port="1" /> <edge from-layer="2009" from-port="0" to-layer="2011" to-port="2" /> <edge from-layer="2010" from-port="0" to-layer="2011" to-port="3" /> <edge from-layer="2011" from-port="5" to-layer="2013" to-port="0" /> <edge from-layer="2012" from-port="0" to-layer="2013" to-port="1" /> <edge from-layer="2013" from-port="2" to-layer="2018" to-port="0" /> <edge from-layer="2014" from-port="0" to-layer="2017" to-port="1" /> <edge from-layer="2015" from-port="0" to-layer="2017" to-port="2" /> <edge from-layer="2016" from-port="0" to-layer="2017" to-port="3" /> <edge from-layer="2017" from-port="5" to-layer="2018" to-port="1" /> <edge from-layer="2018" from-port="2" to-layer="2019" to-port="0" /> <edge from-layer="2019" from-port="2" to-layer="2020" to-port="1" /> <edge from-layer="2020" from-port="2" to-layer="2077" to-port="0" /> <edge from-layer="2021" from-port="1" to-layer="2023" to-port="0" /> <edge from-layer="2022" from-port="0" to-layer="2023" to-port="2" /> <edge from-layer="2023" from-port="3" to-layer="2051" to-port="0" /> <edge from-layer="2024" from-port="0" to-layer="2025" to-port="0" /> <edge from-layer="2025" from-port="1" to-layer="2028" to-port="0" /> <edge from-layer="2026" from-port="0" to-layer="2027" to-port="0" /> <edge from-layer="2027" from-port="1" to-layer="2028" to-port="1" /> <edge from-layer="2028" from-port="2" to-layer="2030" to-port="0" /> <edge from-layer="2029" from-port="0" to-layer="2030" to-port="1" /> <edge from-layer="2030" from-port="2" to-layer="2031" to-port="0" /> <edge from-layer="2031" from-port="1" to-layer="2032" to-port="1" /> <edge from-layer="2032" from-port="2" to-layer="2034" to-port="0" /> <edge from-layer="2033" from-port="0" to-layer="2034" to-port="1" /> <edge from-layer="2034" from-port="2" to-layer="2036" to-port="0" /> <edge from-layer="2035" from-port="0" to-layer="2036" to-port="1" /> <edge from-layer="2036" from-port="2" to-layer="2047" to-port="0" /> <edge from-layer="2036" from-port="2" to-layer="2041" to-port="0" /> <edge from-layer="2036" from-port="2" to-layer="2037" to-port="0" /> <edge from-layer="2037" from-port="2" to-layer="2050" to-port="0" /> <edge from-layer="2038" from-port="0" to-layer="2041" to-port="1" /> <edge from-layer="2039" from-port="0" to-layer="2041" to-port="2" /> <edge from-layer="2040" from-port="0" to-layer="2041" to-port="3" /> <edge from-layer="2041" from-port="5" to-layer="2043" to-port="0" /> <edge from-layer="2042" from-port="0" to-layer="2043" to-port="1" /> <edge from-layer="2043" from-port="2" to-layer="2048" to-port="0" /> <edge from-layer="2044" from-port="0" to-layer="2047" to-port="1" /> <edge from-layer="2045" from-port="0" to-layer="2047" to-port="2" /> <edge from-layer="2046" from-port="0" to-layer="2047" to-port="3" /> <edge from-layer="2047" from-port="5" to-layer="2048" to-port="1" /> <edge from-layer="2048" from-port="2" to-layer="2049" to-port="0" /> <edge from-layer="2049" from-port="2" to-layer="2050" to-port="1" /> <edge from-layer="2050" from-port="2" to-layer="2051" to-port="1" /> <edge from-layer="2051" from-port="2" to-layer="2052" to-port="0" /> <edge from-layer="2051" from-port="2" to-layer="6174" to-port="0" /> <edge from-layer="2052" from-port="2" to-layer="2053" to-port="0" /> <edge from-layer="2053" from-port="2" to-layer="2055" to-port="0" /> <edge from-layer="2054" from-port="0" to-layer="2055" to-port="1" /> <edge from-layer="2055" from-port="2" to-layer="2077" to-port="1" /> <edge from-layer="2056" from-port="1" to-layer="2058" to-port="0" /> <edge from-layer="2057" from-port="0" to-layer="2058" to-port="2" /> <edge from-layer="2058" from-port="3" to-layer="2072" to-port="0" /> <edge from-layer="2059" from-port="0" to-layer="2060" to-port="0" /> <edge from-layer="2060" from-port="1" to-layer="2063" to-port="0" /> <edge from-layer="2061" from-port="0" to-layer="2062" to-port="0" /> <edge from-layer="2062" from-port="1" to-layer="2063" to-port="1" /> <edge from-layer="2063" from-port="2" to-layer="2065" to-port="0" /> <edge from-layer="2064" from-port="0" to-layer="2065" to-port="1" /> <edge from-layer="2065" from-port="2" to-layer="2066" to-port="0" /> <edge from-layer="2066" from-port="1" to-layer="2067" to-port="1" /> <edge from-layer="2067" from-port="2" to-layer="2069" to-port="0" /> <edge from-layer="2068" from-port="0" to-layer="2069" to-port="1" /> <edge from-layer="2069" from-port="2" to-layer="2071" to-port="0" /> <edge from-layer="2070" from-port="0" to-layer="2071" to-port="1" /> <edge from-layer="2071" from-port="2" to-layer="2072" to-port="1" /> <edge from-layer="2072" from-port="2" to-layer="2073" to-port="0" /> <edge from-layer="2072" from-port="2" to-layer="6173" to-port="0" /> <edge from-layer="2073" from-port="2" to-layer="2074" to-port="0" /> <edge from-layer="2074" from-port="2" to-layer="2076" to-port="0" /> <edge from-layer="2075" from-port="0" to-layer="2076" to-port="1" /> <edge from-layer="2076" from-port="2" to-layer="2077" to-port="2" /> <edge from-layer="2077" from-port="4" to-layer="2079" to-port="0" /> <edge from-layer="2078" from-port="0" to-layer="2079" to-port="1" /> <edge from-layer="2079" from-port="2" to-layer="2080" to-port="0" /> <edge from-layer="2080" from-port="2" to-layer="2089" to-port="0" /> <edge from-layer="2081" from-port="0" to-layer="2082" to-port="0" /> <edge from-layer="2082" from-port="1" to-layer="2085" to-port="0" /> <edge from-layer="2083" from-port="0" to-layer="2084" to-port="0" /> <edge from-layer="2084" from-port="1" to-layer="2085" to-port="1" /> <edge from-layer="2085" from-port="2" to-layer="2087" to-port="0" /> <edge from-layer="2086" from-port="0" to-layer="2087" to-port="1" /> <edge from-layer="2087" from-port="2" to-layer="2088" to-port="0" /> <edge from-layer="2088" from-port="1" to-layer="2089" to-port="1" /> <edge from-layer="2089" from-port="2" to-layer="2090" to-port="1" /> <edge from-layer="2090" from-port="2" to-layer="2132" to-port="0" /> <edge from-layer="2090" from-port="2" to-layer="2101" to-port="0" /> <edge from-layer="2090" from-port="2" to-layer="2094" to-port="0" /> <edge from-layer="2091" from-port="0" to-layer="2102" to-port="0" /> <edge from-layer="2092" from-port="0" to-layer="2100" to-port="0" /> <edge from-layer="2093" from-port="0" to-layer="2094" to-port="1" /> <edge from-layer="2094" from-port="2" to-layer="2096" to-port="0" /> <edge from-layer="2095" from-port="0" to-layer="2096" to-port="1" /> <edge from-layer="2096" from-port="2" to-layer="2098" to-port="0" /> <edge from-layer="2097" from-port="0" to-layer="2098" to-port="1" /> <edge from-layer="2098" from-port="2" to-layer="2099" to-port="0" /> <edge from-layer="2099" from-port="1" to-layer="2100" to-port="1" /> <edge from-layer="2100" from-port="2" to-layer="2101" to-port="1" /> <edge from-layer="2101" from-port="2" to-layer="2102" to-port="1" /> <edge from-layer="2102" from-port="2" to-layer="2121" to-port="0" /> <edge from-layer="2102" from-port="2" to-layer="2111" to-port="0" /> <edge from-layer="2103" from-port="0" to-layer="2104" to-port="0" /> <edge from-layer="2104" from-port="1" to-layer="2107" to-port="0" /> <edge from-layer="2105" from-port="0" to-layer="2106" to-port="0" /> <edge from-layer="2106" from-port="1" to-layer="2107" to-port="1" /> <edge from-layer="2107" from-port="2" to-layer="2109" to-port="0" /> <edge from-layer="2108" from-port="0" to-layer="2109" to-port="1" /> <edge from-layer="2109" from-port="2" to-layer="2110" to-port="0" /> <edge from-layer="2110" from-port="1" to-layer="2111" to-port="1" /> <edge from-layer="2111" from-port="2" to-layer="2112" to-port="0" /> <edge from-layer="2112" from-port="1" to-layer="2122" to-port="0" /> <edge from-layer="2113" from-port="0" to-layer="2114" to-port="0" /> <edge from-layer="2114" from-port="1" to-layer="2117" to-port="0" /> <edge from-layer="2115" from-port="0" to-layer="2116" to-port="0" /> <edge from-layer="2116" from-port="1" to-layer="2117" to-port="1" /> <edge from-layer="2117" from-port="2" to-layer="2119" to-port="0" /> <edge from-layer="2118" from-port="0" to-layer="2119" to-port="1" /> <edge from-layer="2119" from-port="2" to-layer="2120" to-port="0" /> <edge from-layer="2120" from-port="1" to-layer="2121" to-port="1" /> <edge from-layer="2121" from-port="2" to-layer="2122" to-port="1" /> <edge from-layer="2122" from-port="2" to-layer="2131" to-port="0" /> <edge from-layer="2123" from-port="0" to-layer="2124" to-port="0" /> <edge from-layer="2124" from-port="1" to-layer="2127" to-port="0" /> <edge from-layer="2125" from-port="0" to-layer="2126" to-port="0" /> <edge from-layer="2126" from-port="1" to-layer="2127" to-port="1" /> <edge from-layer="2127" from-port="2" to-layer="2129" to-port="0" /> <edge from-layer="2128" from-port="0" to-layer="2129" to-port="1" /> <edge from-layer="2129" from-port="2" to-layer="2130" to-port="0" /> <edge from-layer="2130" from-port="1" to-layer="2131" to-port="1" /> <edge from-layer="2131" from-port="2" to-layer="2132" to-port="1" /> <edge from-layer="2132" from-port="2" to-layer="2143" to-port="0" /> <edge from-layer="2132" from-port="2" to-layer="2136" to-port="0" /> <edge from-layer="2132" from-port="2" to-layer="2241" to-port="0" /> <edge from-layer="2133" from-port="0" to-layer="2144" to-port="0" /> <edge from-layer="2134" from-port="0" to-layer="2142" to-port="0" /> <edge from-layer="2135" from-port="0" to-layer="2136" to-port="1" /> <edge from-layer="2136" from-port="2" to-layer="2138" to-port="0" /> <edge from-layer="2137" from-port="0" to-layer="2138" to-port="1" /> <edge from-layer="2138" from-port="2" to-layer="2140" to-port="0" /> <edge from-layer="2139" from-port="0" to-layer="2140" to-port="1" /> <edge from-layer="2140" from-port="2" to-layer="2141" to-port="0" /> <edge from-layer="2141" from-port="1" to-layer="2142" to-port="1" /> <edge from-layer="2142" from-port="2" to-layer="2143" to-port="1" /> <edge from-layer="2143" from-port="2" to-layer="2144" to-port="1" /> <edge from-layer="2144" from-port="2" to-layer="2183" to-port="0" /> <edge from-layer="2144" from-port="2" to-layer="2218" to-port="0" /> <edge from-layer="2144" from-port="2" to-layer="2153" to-port="0" /> <edge from-layer="2145" from-port="0" to-layer="2146" to-port="0" /> <edge from-layer="2146" from-port="1" to-layer="2149" to-port="0" /> <edge from-layer="2147" from-port="0" to-layer="2148" to-port="0" /> <edge from-layer="2148" from-port="1" to-layer="2149" to-port="1" /> <edge from-layer="2149" from-port="2" to-layer="2151" to-port="0" /> <edge from-layer="2150" from-port="0" to-layer="2151" to-port="1" /> <edge from-layer="2151" from-port="2" to-layer="2152" to-port="0" /> <edge from-layer="2152" from-port="1" to-layer="2153" to-port="1" /> <edge from-layer="2153" from-port="2" to-layer="2155" to-port="0" /> <edge from-layer="2154" from-port="0" to-layer="2155" to-port="1" /> <edge from-layer="2155" from-port="2" to-layer="2157" to-port="0" /> <edge from-layer="2156" from-port="0" to-layer="2157" to-port="1" /> <edge from-layer="2157" from-port="2" to-layer="2168" to-port="0" /> <edge from-layer="2157" from-port="2" to-layer="2162" to-port="0" /> <edge from-layer="2157" from-port="2" to-layer="2158" to-port="0" /> <edge from-layer="2158" from-port="2" to-layer="2171" to-port="0" /> <edge from-layer="2159" from-port="0" to-layer="2162" to-port="1" /> <edge from-layer="2160" from-port="0" to-layer="2162" to-port="2" /> <edge from-layer="2161" from-port="0" to-layer="2162" to-port="3" /> <edge from-layer="2162" from-port="5" to-layer="2164" to-port="0" /> <edge from-layer="2163" from-port="0" to-layer="2164" to-port="1" /> <edge from-layer="2164" from-port="2" to-layer="2169" to-port="0" /> <edge from-layer="2165" from-port="0" to-layer="2168" to-port="1" /> <edge from-layer="2166" from-port="0" to-layer="2168" to-port="2" /> <edge from-layer="2167" from-port="0" to-layer="2168" to-port="3" /> <edge from-layer="2168" from-port="5" to-layer="2169" to-port="1" /> <edge from-layer="2169" from-port="2" to-layer="2170" to-port="0" /> <edge from-layer="2170" from-port="2" to-layer="2171" to-port="1" /> <edge from-layer="2171" from-port="2" to-layer="2228" to-port="0" /> <edge from-layer="2172" from-port="1" to-layer="2174" to-port="0" /> <edge from-layer="2173" from-port="0" to-layer="2174" to-port="2" /> <edge from-layer="2174" from-port="3" to-layer="2202" to-port="0" /> <edge from-layer="2175" from-port="0" to-layer="2176" to-port="0" /> <edge from-layer="2176" from-port="1" to-layer="2179" to-port="0" /> <edge from-layer="2177" from-port="0" to-layer="2178" to-port="0" /> <edge from-layer="2178" from-port="1" to-layer="2179" to-port="1" /> <edge from-layer="2179" from-port="2" to-layer="2181" to-port="0" /> <edge from-layer="2180" from-port="0" to-layer="2181" to-port="1" /> <edge from-layer="2181" from-port="2" to-layer="2182" to-port="0" /> <edge from-layer="2182" from-port="1" to-layer="2183" to-port="1" /> <edge from-layer="2183" from-port="2" to-layer="2185" to-port="0" /> <edge from-layer="2184" from-port="0" to-layer="2185" to-port="1" /> <edge from-layer="2185" from-port="2" to-layer="2187" to-port="0" /> <edge from-layer="2186" from-port="0" to-layer="2187" to-port="1" /> <edge from-layer="2187" from-port="2" to-layer="2188" to-port="0" /> <edge from-layer="2187" from-port="2" to-layer="2192" to-port="0" /> <edge from-layer="2187" from-port="2" to-layer="2198" to-port="0" /> <edge from-layer="2188" from-port="2" to-layer="2201" to-port="0" /> <edge from-layer="2189" from-port="0" to-layer="2192" to-port="1" /> <edge from-layer="2190" from-port="0" to-layer="2192" to-port="2" /> <edge from-layer="2191" from-port="0" to-layer="2192" to-port="3" /> <edge from-layer="2192" from-port="5" to-layer="2194" to-port="0" /> <edge from-layer="2193" from-port="0" to-layer="2194" to-port="1" /> <edge from-layer="2194" from-port="2" to-layer="2199" to-port="0" /> <edge from-layer="2195" from-port="0" to-layer="2198" to-port="1" /> <edge from-layer="2196" from-port="0" to-layer="2198" to-port="2" /> <edge from-layer="2197" from-port="0" to-layer="2198" to-port="3" /> <edge from-layer="2198" from-port="5" to-layer="2199" to-port="1" /> <edge from-layer="2199" from-port="2" to-layer="2200" to-port="0" /> <edge from-layer="2200" from-port="2" to-layer="2201" to-port="1" /> <edge from-layer="2201" from-port="2" to-layer="2202" to-port="1" /> <edge from-layer="2202" from-port="2" to-layer="6172" to-port="0" /> <edge from-layer="2202" from-port="2" to-layer="2203" to-port="0" /> <edge from-layer="2203" from-port="2" to-layer="2204" to-port="0" /> <edge from-layer="2204" from-port="2" to-layer="2206" to-port="0" /> <edge from-layer="2205" from-port="0" to-layer="2206" to-port="1" /> <edge from-layer="2206" from-port="2" to-layer="2228" to-port="1" /> <edge from-layer="2207" from-port="1" to-layer="2209" to-port="0" /> <edge from-layer="2208" from-port="0" to-layer="2209" to-port="2" /> <edge from-layer="2209" from-port="3" to-layer="2223" to-port="0" /> <edge from-layer="2210" from-port="0" to-layer="2211" to-port="0" /> <edge from-layer="2211" from-port="1" to-layer="2214" to-port="0" /> <edge from-layer="2212" from-port="0" to-layer="2213" to-port="0" /> <edge from-layer="2213" from-port="1" to-layer="2214" to-port="1" /> <edge from-layer="2214" from-port="2" to-layer="2216" to-port="0" /> <edge from-layer="2215" from-port="0" to-layer="2216" to-port="1" /> <edge from-layer="2216" from-port="2" to-layer="2217" to-port="0" /> <edge from-layer="2217" from-port="1" to-layer="2218" to-port="1" /> <edge from-layer="2218" from-port="2" to-layer="2220" to-port="0" /> <edge from-layer="2219" from-port="0" to-layer="2220" to-port="1" /> <edge from-layer="2220" from-port="2" to-layer="2222" to-port="0" /> <edge from-layer="2221" from-port="0" to-layer="2222" to-port="1" /> <edge from-layer="2222" from-port="2" to-layer="2223" to-port="1" /> <edge from-layer="2223" from-port="2" to-layer="6171" to-port="0" /> <edge from-layer="2223" from-port="2" to-layer="2224" to-port="0" /> <edge from-layer="2224" from-port="2" to-layer="2225" to-port="0" /> <edge from-layer="2225" from-port="2" to-layer="2227" to-port="0" /> <edge from-layer="2226" from-port="0" to-layer="2227" to-port="1" /> <edge from-layer="2227" from-port="2" to-layer="2228" to-port="2" /> <edge from-layer="2228" from-port="4" to-layer="2230" to-port="0" /> <edge from-layer="2229" from-port="0" to-layer="2230" to-port="1" /> <edge from-layer="2230" from-port="2" to-layer="2231" to-port="0" /> <edge from-layer="2231" from-port="2" to-layer="2240" to-port="0" /> <edge from-layer="2232" from-port="0" to-layer="2233" to-port="0" /> <edge from-layer="2233" from-port="1" to-layer="2236" to-port="0" /> <edge from-layer="2234" from-port="0" to-layer="2235" to-port="0" /> <edge from-layer="2235" from-port="1" to-layer="2236" to-port="1" /> <edge from-layer="2236" from-port="2" to-layer="2238" to-port="0" /> <edge from-layer="2237" from-port="0" to-layer="2238" to-port="1" /> <edge from-layer="2238" from-port="2" to-layer="2239" to-port="0" /> <edge from-layer="2239" from-port="1" to-layer="2240" to-port="1" /> <edge from-layer="2240" from-port="2" to-layer="2241" to-port="1" /> <edge from-layer="2241" from-port="2" to-layer="2245" to-port="0" /> <edge from-layer="2241" from-port="2" to-layer="2252" to-port="0" /> <edge from-layer="2241" from-port="2" to-layer="2283" to-port="0" /> <edge from-layer="2242" from-port="0" to-layer="2253" to-port="0" /> <edge from-layer="2243" from-port="0" to-layer="2251" to-port="0" /> <edge from-layer="2244" from-port="0" to-layer="2245" to-port="1" /> <edge from-layer="2245" from-port="2" to-layer="2247" to-port="0" /> <edge from-layer="2246" from-port="0" to-layer="2247" to-port="1" /> <edge from-layer="2247" from-port="2" to-layer="2249" to-port="0" /> <edge from-layer="2248" from-port="0" to-layer="2249" to-port="1" /> <edge from-layer="2249" from-port="2" to-layer="2250" to-port="0" /> <edge from-layer="2250" from-port="1" to-layer="2251" to-port="1" /> <edge from-layer="2251" from-port="2" to-layer="2252" to-port="1" /> <edge from-layer="2252" from-port="2" to-layer="2253" to-port="1" /> <edge from-layer="2253" from-port="2" to-layer="2262" to-port="0" /> <edge from-layer="2253" from-port="2" to-layer="2272" to-port="0" /> <edge from-layer="2254" from-port="0" to-layer="2255" to-port="0" /> <edge from-layer="2255" from-port="1" to-layer="2258" to-port="0" /> <edge from-layer="2256" from-port="0" to-layer="2257" to-port="0" /> <edge from-layer="2257" from-port="1" to-layer="2258" to-port="1" /> <edge from-layer="2258" from-port="2" to-layer="2260" to-port="0" /> <edge from-layer="2259" from-port="0" to-layer="2260" to-port="1" /> <edge from-layer="2260" from-port="2" to-layer="2261" to-port="0" /> <edge from-layer="2261" from-port="1" to-layer="2262" to-port="1" /> <edge from-layer="2262" from-port="2" to-layer="2263" to-port="0" /> <edge from-layer="2263" from-port="1" to-layer="2273" to-port="0" /> <edge from-layer="2264" from-port="0" to-layer="2265" to-port="0" /> <edge from-layer="2265" from-port="1" to-layer="2268" to-port="0" /> <edge from-layer="2266" from-port="0" to-layer="2267" to-port="0" /> <edge from-layer="2267" from-port="1" to-layer="2268" to-port="1" /> <edge from-layer="2268" from-port="2" to-layer="2270" to-port="0" /> <edge from-layer="2269" from-port="0" to-layer="2270" to-port="1" /> <edge from-layer="2270" from-port="2" to-layer="2271" to-port="0" /> <edge from-layer="2271" from-port="1" to-layer="2272" to-port="1" /> <edge from-layer="2272" from-port="2" to-layer="2273" to-port="1" /> <edge from-layer="2273" from-port="2" to-layer="2282" to-port="0" /> <edge from-layer="2274" from-port="0" to-layer="2275" to-port="0" /> <edge from-layer="2275" from-port="1" to-layer="2278" to-port="0" /> <edge from-layer="2276" from-port="0" to-layer="2277" to-port="0" /> <edge from-layer="2277" from-port="1" to-layer="2278" to-port="1" /> <edge from-layer="2278" from-port="2" to-layer="2280" to-port="0" /> <edge from-layer="2279" from-port="0" to-layer="2280" to-port="1" /> <edge from-layer="2280" from-port="2" to-layer="2281" to-port="0" /> <edge from-layer="2281" from-port="1" to-layer="2282" to-port="1" /> <edge from-layer="2282" from-port="2" to-layer="2283" to-port="1" /> <edge from-layer="2283" from-port="2" to-layer="2392" to-port="0" /> <edge from-layer="2283" from-port="2" to-layer="2294" to-port="0" /> <edge from-layer="2283" from-port="2" to-layer="2287" to-port="0" /> <edge from-layer="2284" from-port="0" to-layer="2295" to-port="0" /> <edge from-layer="2285" from-port="0" to-layer="2293" to-port="0" /> <edge from-layer="2286" from-port="0" to-layer="2287" to-port="1" /> <edge from-layer="2287" from-port="2" to-layer="2289" to-port="0" /> <edge from-layer="2288" from-port="0" to-layer="2289" to-port="1" /> <edge from-layer="2289" from-port="2" to-layer="2291" to-port="0" /> <edge from-layer="2290" from-port="0" to-layer="2291" to-port="1" /> <edge from-layer="2291" from-port="2" to-layer="2292" to-port="0" /> <edge from-layer="2292" from-port="1" to-layer="2293" to-port="1" /> <edge from-layer="2293" from-port="2" to-layer="2294" to-port="1" /> <edge from-layer="2294" from-port="2" to-layer="2295" to-port="1" /> <edge from-layer="2295" from-port="2" to-layer="2334" to-port="0" /> <edge from-layer="2295" from-port="2" to-layer="2369" to-port="0" /> <edge from-layer="2295" from-port="2" to-layer="2304" to-port="0" /> <edge from-layer="2296" from-port="0" to-layer="2297" to-port="0" /> <edge from-layer="2297" from-port="1" to-layer="2300" to-port="0" /> <edge from-layer="2298" from-port="0" to-layer="2299" to-port="0" /> <edge from-layer="2299" from-port="1" to-layer="2300" to-port="1" /> <edge from-layer="2300" from-port="2" to-layer="2302" to-port="0" /> <edge from-layer="2301" from-port="0" to-layer="2302" to-port="1" /> <edge from-layer="2302" from-port="2" to-layer="2303" to-port="0" /> <edge from-layer="2303" from-port="1" to-layer="2304" to-port="1" /> <edge from-layer="2304" from-port="2" to-layer="2306" to-port="0" /> <edge from-layer="2305" from-port="0" to-layer="2306" to-port="1" /> <edge from-layer="2306" from-port="2" to-layer="2308" to-port="0" /> <edge from-layer="2307" from-port="0" to-layer="2308" to-port="1" /> <edge from-layer="2308" from-port="2" to-layer="2309" to-port="0" /> <edge from-layer="2308" from-port="2" to-layer="2313" to-port="0" /> <edge from-layer="2308" from-port="2" to-layer="2319" to-port="0" /> <edge from-layer="2309" from-port="2" to-layer="2322" to-port="0" /> <edge from-layer="2310" from-port="0" to-layer="2313" to-port="1" /> <edge from-layer="2311" from-port="0" to-layer="2313" to-port="2" /> <edge from-layer="2312" from-port="0" to-layer="2313" to-port="3" /> <edge from-layer="2313" from-port="5" to-layer="2315" to-port="0" /> <edge from-layer="2314" from-port="0" to-layer="2315" to-port="1" /> <edge from-layer="2315" from-port="2" to-layer="2320" to-port="0" /> <edge from-layer="2316" from-port="0" to-layer="2319" to-port="1" /> <edge from-layer="2317" from-port="0" to-layer="2319" to-port="2" /> <edge from-layer="2318" from-port="0" to-layer="2319" to-port="3" /> <edge from-layer="2319" from-port="5" to-layer="2320" to-port="1" /> <edge from-layer="2320" from-port="2" to-layer="2321" to-port="0" /> <edge from-layer="2321" from-port="2" to-layer="2322" to-port="1" /> <edge from-layer="2322" from-port="2" to-layer="2379" to-port="0" /> <edge from-layer="2323" from-port="1" to-layer="2325" to-port="0" /> <edge from-layer="2324" from-port="0" to-layer="2325" to-port="2" /> <edge from-layer="2325" from-port="3" to-layer="2353" to-port="0" /> <edge from-layer="2326" from-port="0" to-layer="2327" to-port="0" /> <edge from-layer="2327" from-port="1" to-layer="2330" to-port="0" /> <edge from-layer="2328" from-port="0" to-layer="2329" to-port="0" /> <edge from-layer="2329" from-port="1" to-layer="2330" to-port="1" /> <edge from-layer="2330" from-port="2" to-layer="2332" to-port="0" /> <edge from-layer="2331" from-port="0" to-layer="2332" to-port="1" /> <edge from-layer="2332" from-port="2" to-layer="2333" to-port="0" /> <edge from-layer="2333" from-port="1" to-layer="2334" to-port="1" /> <edge from-layer="2334" from-port="2" to-layer="2336" to-port="0" /> <edge from-layer="2335" from-port="0" to-layer="2336" to-port="1" /> <edge from-layer="2336" from-port="2" to-layer="2338" to-port="0" /> <edge from-layer="2337" from-port="0" to-layer="2338" to-port="1" /> <edge from-layer="2338" from-port="2" to-layer="2339" to-port="0" /> <edge from-layer="2338" from-port="2" to-layer="2343" to-port="0" /> <edge from-layer="2338" from-port="2" to-layer="2349" to-port="0" /> <edge from-layer="2339" from-port="2" to-layer="2352" to-port="0" /> <edge from-layer="2340" from-port="0" to-layer="2343" to-port="1" /> <edge from-layer="2341" from-port="0" to-layer="2343" to-port="2" /> <edge from-layer="2342" from-port="0" to-layer="2343" to-port="3" /> <edge from-layer="2343" from-port="5" to-layer="2345" to-port="0" /> <edge from-layer="2344" from-port="0" to-layer="2345" to-port="1" /> <edge from-layer="2345" from-port="2" to-layer="2350" to-port="0" /> <edge from-layer="2346" from-port="0" to-layer="2349" to-port="1" /> <edge from-layer="2347" from-port="0" to-layer="2349" to-port="2" /> <edge from-layer="2348" from-port="0" to-layer="2349" to-port="3" /> <edge from-layer="2349" from-port="5" to-layer="2350" to-port="1" /> <edge from-layer="2350" from-port="2" to-layer="2351" to-port="0" /> <edge from-layer="2351" from-port="2" to-layer="2352" to-port="1" /> <edge from-layer="2352" from-port="2" to-layer="2353" to-port="1" /> <edge from-layer="2353" from-port="2" to-layer="6170" to-port="0" /> <edge from-layer="2353" from-port="2" to-layer="2354" to-port="0" /> <edge from-layer="2354" from-port="2" to-layer="2355" to-port="0" /> <edge from-layer="2355" from-port="2" to-layer="2357" to-port="0" /> <edge from-layer="2356" from-port="0" to-layer="2357" to-port="1" /> <edge from-layer="2357" from-port="2" to-layer="2379" to-port="1" /> <edge from-layer="2358" from-port="1" to-layer="2360" to-port="0" /> <edge from-layer="2359" from-port="0" to-layer="2360" to-port="2" /> <edge from-layer="2360" from-port="3" to-layer="2374" to-port="0" /> <edge from-layer="2361" from-port="0" to-layer="2362" to-port="0" /> <edge from-layer="2362" from-port="1" to-layer="2365" to-port="0" /> <edge from-layer="2363" from-port="0" to-layer="2364" to-port="0" /> <edge from-layer="2364" from-port="1" to-layer="2365" to-port="1" /> <edge from-layer="2365" from-port="2" to-layer="2367" to-port="0" /> <edge from-layer="2366" from-port="0" to-layer="2367" to-port="1" /> <edge from-layer="2367" from-port="2" to-layer="2368" to-port="0" /> <edge from-layer="2368" from-port="1" to-layer="2369" to-port="1" /> <edge from-layer="2369" from-port="2" to-layer="2371" to-port="0" /> <edge from-layer="2370" from-port="0" to-layer="2371" to-port="1" /> <edge from-layer="2371" from-port="2" to-layer="2373" to-port="0" /> <edge from-layer="2372" from-port="0" to-layer="2373" to-port="1" /> <edge from-layer="2373" from-port="2" to-layer="2374" to-port="1" /> <edge from-layer="2374" from-port="2" to-layer="2375" to-port="0" /> <edge from-layer="2374" from-port="2" to-layer="6169" to-port="0" /> <edge from-layer="2375" from-port="2" to-layer="2376" to-port="0" /> <edge from-layer="2376" from-port="2" to-layer="2378" to-port="0" /> <edge from-layer="2377" from-port="0" to-layer="2378" to-port="1" /> <edge from-layer="2378" from-port="2" to-layer="2379" to-port="2" /> <edge from-layer="2379" from-port="4" to-layer="2381" to-port="0" /> <edge from-layer="2380" from-port="0" to-layer="2381" to-port="1" /> <edge from-layer="2381" from-port="2" to-layer="2382" to-port="0" /> <edge from-layer="2382" from-port="2" to-layer="2391" to-port="0" /> <edge from-layer="2383" from-port="0" to-layer="2384" to-port="0" /> <edge from-layer="2384" from-port="1" to-layer="2387" to-port="0" /> <edge from-layer="2385" from-port="0" to-layer="2386" to-port="0" /> <edge from-layer="2386" from-port="1" to-layer="2387" to-port="1" /> <edge from-layer="2387" from-port="2" to-layer="2389" to-port="0" /> <edge from-layer="2388" from-port="0" to-layer="2389" to-port="1" /> <edge from-layer="2389" from-port="2" to-layer="2390" to-port="0" /> <edge from-layer="2390" from-port="1" to-layer="2391" to-port="1" /> <edge from-layer="2391" from-port="2" to-layer="2392" to-port="1" /> <edge from-layer="2392" from-port="2" to-layer="2434" to-port="0" /> <edge from-layer="2392" from-port="2" to-layer="2403" to-port="0" /> <edge from-layer="2392" from-port="2" to-layer="2396" to-port="0" /> <edge from-layer="2393" from-port="0" to-layer="2404" to-port="0" /> <edge from-layer="2394" from-port="0" to-layer="2402" to-port="0" /> <edge from-layer="2395" from-port="0" to-layer="2396" to-port="1" /> <edge from-layer="2396" from-port="2" to-layer="2398" to-port="0" /> <edge from-layer="2397" from-port="0" to-layer="2398" to-port="1" /> <edge from-layer="2398" from-port="2" to-layer="2400" to-port="0" /> <edge from-layer="2399" from-port="0" to-layer="2400" to-port="1" /> <edge from-layer="2400" from-port="2" to-layer="2401" to-port="0" /> <edge from-layer="2401" from-port="1" to-layer="2402" to-port="1" /> <edge from-layer="2402" from-port="2" to-layer="2403" to-port="1" /> <edge from-layer="2403" from-port="2" to-layer="2404" to-port="1" /> <edge from-layer="2404" from-port="2" to-layer="2423" to-port="0" /> <edge from-layer="2404" from-port="2" to-layer="2413" to-port="0" /> <edge from-layer="2405" from-port="0" to-layer="2406" to-port="0" /> <edge from-layer="2406" from-port="1" to-layer="2409" to-port="0" /> <edge from-layer="2407" from-port="0" to-layer="2408" to-port="0" /> <edge from-layer="2408" from-port="1" to-layer="2409" to-port="1" /> <edge from-layer="2409" from-port="2" to-layer="2411" to-port="0" /> <edge from-layer="2410" from-port="0" to-layer="2411" to-port="1" /> <edge from-layer="2411" from-port="2" to-layer="2412" to-port="0" /> <edge from-layer="2412" from-port="1" to-layer="2413" to-port="1" /> <edge from-layer="2413" from-port="2" to-layer="2414" to-port="0" /> <edge from-layer="2414" from-port="1" to-layer="2424" to-port="0" /> <edge from-layer="2415" from-port="0" to-layer="2416" to-port="0" /> <edge from-layer="2416" from-port="1" to-layer="2419" to-port="0" /> <edge from-layer="2417" from-port="0" to-layer="2418" to-port="0" /> <edge from-layer="2418" from-port="1" to-layer="2419" to-port="1" /> <edge from-layer="2419" from-port="2" to-layer="2421" to-port="0" /> <edge from-layer="2420" from-port="0" to-layer="2421" to-port="1" /> <edge from-layer="2421" from-port="2" to-layer="2422" to-port="0" /> <edge from-layer="2422" from-port="1" to-layer="2423" to-port="1" /> <edge from-layer="2423" from-port="2" to-layer="2424" to-port="1" /> <edge from-layer="2424" from-port="2" to-layer="2433" to-port="0" /> <edge from-layer="2425" from-port="0" to-layer="2426" to-port="0" /> <edge from-layer="2426" from-port="1" to-layer="2429" to-port="0" /> <edge from-layer="2427" from-port="0" to-layer="2428" to-port="0" /> <edge from-layer="2428" from-port="1" to-layer="2429" to-port="1" /> <edge from-layer="2429" from-port="2" to-layer="2431" to-port="0" /> <edge from-layer="2430" from-port="0" to-layer="2431" to-port="1" /> <edge from-layer="2431" from-port="2" to-layer="2432" to-port="0" /> <edge from-layer="2432" from-port="1" to-layer="2433" to-port="1" /> <edge from-layer="2433" from-port="2" to-layer="2434" to-port="1" /> <edge from-layer="2434" from-port="2" to-layer="2438" to-port="0" /> <edge from-layer="2434" from-port="2" to-layer="2543" to-port="0" /> <edge from-layer="2434" from-port="2" to-layer="2445" to-port="0" /> <edge from-layer="2435" from-port="0" to-layer="2446" to-port="0" /> <edge from-layer="2436" from-port="0" to-layer="2444" to-port="0" /> <edge from-layer="2437" from-port="0" to-layer="2438" to-port="1" /> <edge from-layer="2438" from-port="2" to-layer="2440" to-port="0" /> <edge from-layer="2439" from-port="0" to-layer="2440" to-port="1" /> <edge from-layer="2440" from-port="2" to-layer="2442" to-port="0" /> <edge from-layer="2441" from-port="0" to-layer="2442" to-port="1" /> <edge from-layer="2442" from-port="2" to-layer="2443" to-port="0" /> <edge from-layer="2443" from-port="1" to-layer="2444" to-port="1" /> <edge from-layer="2444" from-port="2" to-layer="2445" to-port="1" /> <edge from-layer="2445" from-port="2" to-layer="2446" to-port="1" /> <edge from-layer="2446" from-port="2" to-layer="2520" to-port="0" /> <edge from-layer="2446" from-port="2" to-layer="2455" to-port="0" /> <edge from-layer="2446" from-port="2" to-layer="2485" to-port="0" /> <edge from-layer="2447" from-port="0" to-layer="2448" to-port="0" /> <edge from-layer="2448" from-port="1" to-layer="2451" to-port="0" /> <edge from-layer="2449" from-port="0" to-layer="2450" to-port="0" /> <edge from-layer="2450" from-port="1" to-layer="2451" to-port="1" /> <edge from-layer="2451" from-port="2" to-layer="2453" to-port="0" /> <edge from-layer="2452" from-port="0" to-layer="2453" to-port="1" /> <edge from-layer="2453" from-port="2" to-layer="2454" to-port="0" /> <edge from-layer="2454" from-port="1" to-layer="2455" to-port="1" /> <edge from-layer="2455" from-port="2" to-layer="2457" to-port="0" /> <edge from-layer="2456" from-port="0" to-layer="2457" to-port="1" /> <edge from-layer="2457" from-port="2" to-layer="2459" to-port="0" /> <edge from-layer="2458" from-port="0" to-layer="2459" to-port="1" /> <edge from-layer="2459" from-port="2" to-layer="2470" to-port="0" /> <edge from-layer="2459" from-port="2" to-layer="2464" to-port="0" /> <edge from-layer="2459" from-port="2" to-layer="2460" to-port="0" /> <edge from-layer="2460" from-port="2" to-layer="2473" to-port="0" /> <edge from-layer="2461" from-port="0" to-layer="2464" to-port="1" /> <edge from-layer="2462" from-port="0" to-layer="2464" to-port="2" /> <edge from-layer="2463" from-port="0" to-layer="2464" to-port="3" /> <edge from-layer="2464" from-port="5" to-layer="2466" to-port="0" /> <edge from-layer="2465" from-port="0" to-layer="2466" to-port="1" /> <edge from-layer="2466" from-port="2" to-layer="2471" to-port="0" /> <edge from-layer="2467" from-port="0" to-layer="2470" to-port="1" /> <edge from-layer="2468" from-port="0" to-layer="2470" to-port="2" /> <edge from-layer="2469" from-port="0" to-layer="2470" to-port="3" /> <edge from-layer="2470" from-port="5" to-layer="2471" to-port="1" /> <edge from-layer="2471" from-port="2" to-layer="2472" to-port="0" /> <edge from-layer="2472" from-port="2" to-layer="2473" to-port="1" /> <edge from-layer="2473" from-port="2" to-layer="2530" to-port="0" /> <edge from-layer="2474" from-port="1" to-layer="2476" to-port="0" /> <edge from-layer="2475" from-port="0" to-layer="2476" to-port="2" /> <edge from-layer="2476" from-port="3" to-layer="2504" to-port="0" /> <edge from-layer="2477" from-port="0" to-layer="2478" to-port="0" /> <edge from-layer="2478" from-port="1" to-layer="2481" to-port="0" /> <edge from-layer="2479" from-port="0" to-layer="2480" to-port="0" /> <edge from-layer="2480" from-port="1" to-layer="2481" to-port="1" /> <edge from-layer="2481" from-port="2" to-layer="2483" to-port="0" /> <edge from-layer="2482" from-port="0" to-layer="2483" to-port="1" /> <edge from-layer="2483" from-port="2" to-layer="2484" to-port="0" /> <edge from-layer="2484" from-port="1" to-layer="2485" to-port="1" /> <edge from-layer="2485" from-port="2" to-layer="2487" to-port="0" /> <edge from-layer="2486" from-port="0" to-layer="2487" to-port="1" /> <edge from-layer="2487" from-port="2" to-layer="2489" to-port="0" /> <edge from-layer="2488" from-port="0" to-layer="2489" to-port="1" /> <edge from-layer="2489" from-port="2" to-layer="2500" to-port="0" /> <edge from-layer="2489" from-port="2" to-layer="2490" to-port="0" /> <edge from-layer="2489" from-port="2" to-layer="2494" to-port="0" /> <edge from-layer="2490" from-port="2" to-layer="2503" to-port="0" /> <edge from-layer="2491" from-port="0" to-layer="2494" to-port="1" /> <edge from-layer="2492" from-port="0" to-layer="2494" to-port="2" /> <edge from-layer="2493" from-port="0" to-layer="2494" to-port="3" /> <edge from-layer="2494" from-port="5" to-layer="2496" to-port="0" /> <edge from-layer="2495" from-port="0" to-layer="2496" to-port="1" /> <edge from-layer="2496" from-port="2" to-layer="2501" to-port="0" /> <edge from-layer="2497" from-port="0" to-layer="2500" to-port="1" /> <edge from-layer="2498" from-port="0" to-layer="2500" to-port="2" /> <edge from-layer="2499" from-port="0" to-layer="2500" to-port="3" /> <edge from-layer="2500" from-port="5" to-layer="2501" to-port="1" /> <edge from-layer="2501" from-port="2" to-layer="2502" to-port="0" /> <edge from-layer="2502" from-port="2" to-layer="2503" to-port="1" /> <edge from-layer="2503" from-port="2" to-layer="2504" to-port="1" /> <edge from-layer="2504" from-port="2" to-layer="6168" to-port="0" /> <edge from-layer="2504" from-port="2" to-layer="2505" to-port="0" /> <edge from-layer="2505" from-port="2" to-layer="2506" to-port="0" /> <edge from-layer="2506" from-port="2" to-layer="2508" to-port="0" /> <edge from-layer="2507" from-port="0" to-layer="2508" to-port="1" /> <edge from-layer="2508" from-port="2" to-layer="2530" to-port="1" /> <edge from-layer="2509" from-port="1" to-layer="2511" to-port="0" /> <edge from-layer="2510" from-port="0" to-layer="2511" to-port="2" /> <edge from-layer="2511" from-port="3" to-layer="2525" to-port="0" /> <edge from-layer="2512" from-port="0" to-layer="2513" to-port="0" /> <edge from-layer="2513" from-port="1" to-layer="2516" to-port="0" /> <edge from-layer="2514" from-port="0" to-layer="2515" to-port="0" /> <edge from-layer="2515" from-port="1" to-layer="2516" to-port="1" /> <edge from-layer="2516" from-port="2" to-layer="2518" to-port="0" /> <edge from-layer="2517" from-port="0" to-layer="2518" to-port="1" /> <edge from-layer="2518" from-port="2" to-layer="2519" to-port="0" /> <edge from-layer="2519" from-port="1" to-layer="2520" to-port="1" /> <edge from-layer="2520" from-port="2" to-layer="2522" to-port="0" /> <edge from-layer="2521" from-port="0" to-layer="2522" to-port="1" /> <edge from-layer="2522" from-port="2" to-layer="2524" to-port="0" /> <edge from-layer="2523" from-port="0" to-layer="2524" to-port="1" /> <edge from-layer="2524" from-port="2" to-layer="2525" to-port="1" /> <edge from-layer="2525" from-port="2" to-layer="2526" to-port="0" /> <edge from-layer="2525" from-port="2" to-layer="6167" to-port="0" /> <edge from-layer="2526" from-port="2" to-layer="2527" to-port="0" /> <edge from-layer="2527" from-port="2" to-layer="2529" to-port="0" /> <edge from-layer="2528" from-port="0" to-layer="2529" to-port="1" /> <edge from-layer="2529" from-port="2" to-layer="2530" to-port="2" /> <edge from-layer="2530" from-port="4" to-layer="2532" to-port="0" /> <edge from-layer="2531" from-port="0" to-layer="2532" to-port="1" /> <edge from-layer="2532" from-port="2" to-layer="2533" to-port="0" /> <edge from-layer="2533" from-port="2" to-layer="2542" to-port="0" /> <edge from-layer="2534" from-port="0" to-layer="2535" to-port="0" /> <edge from-layer="2535" from-port="1" to-layer="2538" to-port="0" /> <edge from-layer="2536" from-port="0" to-layer="2537" to-port="0" /> <edge from-layer="2537" from-port="1" to-layer="2538" to-port="1" /> <edge from-layer="2538" from-port="2" to-layer="2540" to-port="0" /> <edge from-layer="2539" from-port="0" to-layer="2540" to-port="1" /> <edge from-layer="2540" from-port="2" to-layer="2541" to-port="0" /> <edge from-layer="2541" from-port="1" to-layer="2542" to-port="1" /> <edge from-layer="2542" from-port="2" to-layer="2543" to-port="1" /> <edge from-layer="2543" from-port="2" to-layer="2547" to-port="0" /> <edge from-layer="2543" from-port="2" to-layer="2585" to-port="0" /> <edge from-layer="2543" from-port="2" to-layer="2554" to-port="0" /> <edge from-layer="2544" from-port="0" to-layer="2555" to-port="0" /> <edge from-layer="2545" from-port="0" to-layer="2553" to-port="0" /> <edge from-layer="2546" from-port="0" to-layer="2547" to-port="1" /> <edge from-layer="2547" from-port="2" to-layer="2549" to-port="0" /> <edge from-layer="2548" from-port="0" to-layer="2549" to-port="1" /> <edge from-layer="2549" from-port="2" to-layer="2551" to-port="0" /> <edge from-layer="2550" from-port="0" to-layer="2551" to-port="1" /> <edge from-layer="2551" from-port="2" to-layer="2552" to-port="0" /> <edge from-layer="2552" from-port="1" to-layer="2553" to-port="1" /> <edge from-layer="2553" from-port="2" to-layer="2554" to-port="1" /> <edge from-layer="2554" from-port="2" to-layer="2555" to-port="1" /> <edge from-layer="2555" from-port="2" to-layer="2574" to-port="0" /> <edge from-layer="2555" from-port="2" to-layer="2564" to-port="0" /> <edge from-layer="2556" from-port="0" to-layer="2557" to-port="0" /> <edge from-layer="2557" from-port="1" to-layer="2560" to-port="0" /> <edge from-layer="2558" from-port="0" to-layer="2559" to-port="0" /> <edge from-layer="2559" from-port="1" to-layer="2560" to-port="1" /> <edge from-layer="2560" from-port="2" to-layer="2562" to-port="0" /> <edge from-layer="2561" from-port="0" to-layer="2562" to-port="1" /> <edge from-layer="2562" from-port="2" to-layer="2563" to-port="0" /> <edge from-layer="2563" from-port="1" to-layer="2564" to-port="1" /> <edge from-layer="2564" from-port="2" to-layer="2565" to-port="0" /> <edge from-layer="2565" from-port="1" to-layer="2575" to-port="0" /> <edge from-layer="2566" from-port="0" to-layer="2567" to-port="0" /> <edge from-layer="2567" from-port="1" to-layer="2570" to-port="0" /> <edge from-layer="2568" from-port="0" to-layer="2569" to-port="0" /> <edge from-layer="2569" from-port="1" to-layer="2570" to-port="1" /> <edge from-layer="2570" from-port="2" to-layer="2572" to-port="0" /> <edge from-layer="2571" from-port="0" to-layer="2572" to-port="1" /> <edge from-layer="2572" from-port="2" to-layer="2573" to-port="0" /> <edge from-layer="2573" from-port="1" to-layer="2574" to-port="1" /> <edge from-layer="2574" from-port="2" to-layer="2575" to-port="1" /> <edge from-layer="2575" from-port="2" to-layer="2584" to-port="0" /> <edge from-layer="2576" from-port="0" to-layer="2577" to-port="0" /> <edge from-layer="2577" from-port="1" to-layer="2580" to-port="0" /> <edge from-layer="2578" from-port="0" to-layer="2579" to-port="0" /> <edge from-layer="2579" from-port="1" to-layer="2580" to-port="1" /> <edge from-layer="2580" from-port="2" to-layer="2582" to-port="0" /> <edge from-layer="2581" from-port="0" to-layer="2582" to-port="1" /> <edge from-layer="2582" from-port="2" to-layer="2583" to-port="0" /> <edge from-layer="2583" from-port="1" to-layer="2584" to-port="1" /> <edge from-layer="2584" from-port="2" to-layer="2585" to-port="1" /> <edge from-layer="2585" from-port="2" to-layer="2589" to-port="0" /> <edge from-layer="2585" from-port="2" to-layer="2694" to-port="0" /> <edge from-layer="2585" from-port="2" to-layer="2596" to-port="0" /> <edge from-layer="2586" from-port="0" to-layer="2597" to-port="0" /> <edge from-layer="2587" from-port="0" to-layer="2595" to-port="0" /> <edge from-layer="2588" from-port="0" to-layer="2589" to-port="1" /> <edge from-layer="2589" from-port="2" to-layer="2591" to-port="0" /> <edge from-layer="2590" from-port="0" to-layer="2591" to-port="1" /> <edge from-layer="2591" from-port="2" to-layer="2593" to-port="0" /> <edge from-layer="2592" from-port="0" to-layer="2593" to-port="1" /> <edge from-layer="2593" from-port="2" to-layer="2594" to-port="0" /> <edge from-layer="2594" from-port="1" to-layer="2595" to-port="1" /> <edge from-layer="2595" from-port="2" to-layer="2596" to-port="1" /> <edge from-layer="2596" from-port="2" to-layer="2597" to-port="1" /> <edge from-layer="2597" from-port="2" to-layer="2671" to-port="0" /> <edge from-layer="2597" from-port="2" to-layer="2636" to-port="0" /> <edge from-layer="2597" from-port="2" to-layer="2606" to-port="0" /> <edge from-layer="2598" from-port="0" to-layer="2599" to-port="0" /> <edge from-layer="2599" from-port="1" to-layer="2602" to-port="0" /> <edge from-layer="2600" from-port="0" to-layer="2601" to-port="0" /> <edge from-layer="2601" from-port="1" to-layer="2602" to-port="1" /> <edge from-layer="2602" from-port="2" to-layer="2604" to-port="0" /> <edge from-layer="2603" from-port="0" to-layer="2604" to-port="1" /> <edge from-layer="2604" from-port="2" to-layer="2605" to-port="0" /> <edge from-layer="2605" from-port="1" to-layer="2606" to-port="1" /> <edge from-layer="2606" from-port="2" to-layer="2608" to-port="0" /> <edge from-layer="2607" from-port="0" to-layer="2608" to-port="1" /> <edge from-layer="2608" from-port="2" to-layer="2610" to-port="0" /> <edge from-layer="2609" from-port="0" to-layer="2610" to-port="1" /> <edge from-layer="2610" from-port="2" to-layer="2621" to-port="0" /> <edge from-layer="2610" from-port="2" to-layer="2611" to-port="0" /> <edge from-layer="2610" from-port="2" to-layer="2615" to-port="0" /> <edge from-layer="2611" from-port="2" to-layer="2624" to-port="0" /> <edge from-layer="2612" from-port="0" to-layer="2615" to-port="1" /> <edge from-layer="2613" from-port="0" to-layer="2615" to-port="2" /> <edge from-layer="2614" from-port="0" to-layer="2615" to-port="3" /> <edge from-layer="2615" from-port="5" to-layer="2617" to-port="0" /> <edge from-layer="2616" from-port="0" to-layer="2617" to-port="1" /> <edge from-layer="2617" from-port="2" to-layer="2622" to-port="0" /> <edge from-layer="2618" from-port="0" to-layer="2621" to-port="1" /> <edge from-layer="2619" from-port="0" to-layer="2621" to-port="2" /> <edge from-layer="2620" from-port="0" to-layer="2621" to-port="3" /> <edge from-layer="2621" from-port="5" to-layer="2622" to-port="1" /> <edge from-layer="2622" from-port="2" to-layer="2623" to-port="0" /> <edge from-layer="2623" from-port="2" to-layer="2624" to-port="1" /> <edge from-layer="2624" from-port="2" to-layer="2681" to-port="0" /> <edge from-layer="2625" from-port="1" to-layer="2627" to-port="0" /> <edge from-layer="2626" from-port="0" to-layer="2627" to-port="2" /> <edge from-layer="2627" from-port="3" to-layer="2655" to-port="0" /> <edge from-layer="2628" from-port="0" to-layer="2629" to-port="0" /> <edge from-layer="2629" from-port="1" to-layer="2632" to-port="0" /> <edge from-layer="2630" from-port="0" to-layer="2631" to-port="0" /> <edge from-layer="2631" from-port="1" to-layer="2632" to-port="1" /> <edge from-layer="2632" from-port="2" to-layer="2634" to-port="0" /> <edge from-layer="2633" from-port="0" to-layer="2634" to-port="1" /> <edge from-layer="2634" from-port="2" to-layer="2635" to-port="0" /> <edge from-layer="2635" from-port="1" to-layer="2636" to-port="1" /> <edge from-layer="2636" from-port="2" to-layer="2638" to-port="0" /> <edge from-layer="2637" from-port="0" to-layer="2638" to-port="1" /> <edge from-layer="2638" from-port="2" to-layer="2640" to-port="0" /> <edge from-layer="2639" from-port="0" to-layer="2640" to-port="1" /> <edge from-layer="2640" from-port="2" to-layer="2641" to-port="0" /> <edge from-layer="2640" from-port="2" to-layer="2645" to-port="0" /> <edge from-layer="2640" from-port="2" to-layer="2651" to-port="0" /> <edge from-layer="2641" from-port="2" to-layer="2654" to-port="0" /> <edge from-layer="2642" from-port="0" to-layer="2645" to-port="1" /> <edge from-layer="2643" from-port="0" to-layer="2645" to-port="2" /> <edge from-layer="2644" from-port="0" to-layer="2645" to-port="3" /> <edge from-layer="2645" from-port="5" to-layer="2647" to-port="0" /> <edge from-layer="2646" from-port="0" to-layer="2647" to-port="1" /> <edge from-layer="2647" from-port="2" to-layer="2652" to-port="0" /> <edge from-layer="2648" from-port="0" to-layer="2651" to-port="1" /> <edge from-layer="2649" from-port="0" to-layer="2651" to-port="2" /> <edge from-layer="2650" from-port="0" to-layer="2651" to-port="3" /> <edge from-layer="2651" from-port="5" to-layer="2652" to-port="1" /> <edge from-layer="2652" from-port="2" to-layer="2653" to-port="0" /> <edge from-layer="2653" from-port="2" to-layer="2654" to-port="1" /> <edge from-layer="2654" from-port="2" to-layer="2655" to-port="1" /> <edge from-layer="2655" from-port="2" to-layer="2656" to-port="0" /> <edge from-layer="2655" from-port="2" to-layer="6166" to-port="0" /> <edge from-layer="2656" from-port="2" to-layer="2657" to-port="0" /> <edge from-layer="2657" from-port="2" to-layer="2659" to-port="0" /> <edge from-layer="2658" from-port="0" to-layer="2659" to-port="1" /> <edge from-layer="2659" from-port="2" to-layer="2681" to-port="1" /> <edge from-layer="2660" from-port="1" to-layer="2662" to-port="0" /> <edge from-layer="2661" from-port="0" to-layer="2662" to-port="2" /> <edge from-layer="2662" from-port="3" to-layer="2676" to-port="0" /> <edge from-layer="2663" from-port="0" to-layer="2664" to-port="0" /> <edge from-layer="2664" from-port="1" to-layer="2667" to-port="0" /> <edge from-layer="2665" from-port="0" to-layer="2666" to-port="0" /> <edge from-layer="2666" from-port="1" to-layer="2667" to-port="1" /> <edge from-layer="2667" from-port="2" to-layer="2669" to-port="0" /> <edge from-layer="2668" from-port="0" to-layer="2669" to-port="1" /> <edge from-layer="2669" from-port="2" to-layer="2670" to-port="0" /> <edge from-layer="2670" from-port="1" to-layer="2671" to-port="1" /> <edge from-layer="2671" from-port="2" to-layer="2673" to-port="0" /> <edge from-layer="2672" from-port="0" to-layer="2673" to-port="1" /> <edge from-layer="2673" from-port="2" to-layer="2675" to-port="0" /> <edge from-layer="2674" from-port="0" to-layer="2675" to-port="1" /> <edge from-layer="2675" from-port="2" to-layer="2676" to-port="1" /> <edge from-layer="2676" from-port="2" to-layer="2677" to-port="0" /> <edge from-layer="2676" from-port="2" to-layer="6165" to-port="0" /> <edge from-layer="2677" from-port="2" to-layer="2678" to-port="0" /> <edge from-layer="2678" from-port="2" to-layer="2680" to-port="0" /> <edge from-layer="2679" from-port="0" to-layer="2680" to-port="1" /> <edge from-layer="2680" from-port="2" to-layer="2681" to-port="2" /> <edge from-layer="2681" from-port="4" to-layer="2683" to-port="0" /> <edge from-layer="2682" from-port="0" to-layer="2683" to-port="1" /> <edge from-layer="2683" from-port="2" to-layer="2684" to-port="0" /> <edge from-layer="2684" from-port="2" to-layer="2693" to-port="0" /> <edge from-layer="2685" from-port="0" to-layer="2686" to-port="0" /> <edge from-layer="2686" from-port="1" to-layer="2689" to-port="0" /> <edge from-layer="2687" from-port="0" to-layer="2688" to-port="0" /> <edge from-layer="2688" from-port="1" to-layer="2689" to-port="1" /> <edge from-layer="2689" from-port="2" to-layer="2691" to-port="0" /> <edge from-layer="2690" from-port="0" to-layer="2691" to-port="1" /> <edge from-layer="2691" from-port="2" to-layer="2692" to-port="0" /> <edge from-layer="2692" from-port="1" to-layer="2693" to-port="1" /> <edge from-layer="2693" from-port="2" to-layer="2694" to-port="1" /> <edge from-layer="2694" from-port="2" to-layer="2736" to-port="0" /> <edge from-layer="2694" from-port="2" to-layer="2698" to-port="0" /> <edge from-layer="2694" from-port="2" to-layer="2705" to-port="0" /> <edge from-layer="2695" from-port="0" to-layer="2706" to-port="0" /> <edge from-layer="2696" from-port="0" to-layer="2704" to-port="0" /> <edge from-layer="2697" from-port="0" to-layer="2698" to-port="1" /> <edge from-layer="2698" from-port="2" to-layer="2700" to-port="0" /> <edge from-layer="2699" from-port="0" to-layer="2700" to-port="1" /> <edge from-layer="2700" from-port="2" to-layer="2702" to-port="0" /> <edge from-layer="2701" from-port="0" to-layer="2702" to-port="1" /> <edge from-layer="2702" from-port="2" to-layer="2703" to-port="0" /> <edge from-layer="2703" from-port="1" to-layer="2704" to-port="1" /> <edge from-layer="2704" from-port="2" to-layer="2705" to-port="1" /> <edge from-layer="2705" from-port="2" to-layer="2706" to-port="1" /> <edge from-layer="2706" from-port="2" to-layer="2715" to-port="0" /> <edge from-layer="2706" from-port="2" to-layer="2725" to-port="0" /> <edge from-layer="2707" from-port="0" to-layer="2708" to-port="0" /> <edge from-layer="2708" from-port="1" to-layer="2711" to-port="0" /> <edge from-layer="2709" from-port="0" to-layer="2710" to-port="0" /> <edge from-layer="2710" from-port="1" to-layer="2711" to-port="1" /> <edge from-layer="2711" from-port="2" to-layer="2713" to-port="0" /> <edge from-layer="2712" from-port="0" to-layer="2713" to-port="1" /> <edge from-layer="2713" from-port="2" to-layer="2714" to-port="0" /> <edge from-layer="2714" from-port="1" to-layer="2715" to-port="1" /> <edge from-layer="2715" from-port="2" to-layer="2716" to-port="0" /> <edge from-layer="2716" from-port="1" to-layer="2726" to-port="0" /> <edge from-layer="2717" from-port="0" to-layer="2718" to-port="0" /> <edge from-layer="2718" from-port="1" to-layer="2721" to-port="0" /> <edge from-layer="2719" from-port="0" to-layer="2720" to-port="0" /> <edge from-layer="2720" from-port="1" to-layer="2721" to-port="1" /> <edge from-layer="2721" from-port="2" to-layer="2723" to-port="0" /> <edge from-layer="2722" from-port="0" to-layer="2723" to-port="1" /> <edge from-layer="2723" from-port="2" to-layer="2724" to-port="0" /> <edge from-layer="2724" from-port="1" to-layer="2725" to-port="1" /> <edge from-layer="2725" from-port="2" to-layer="2726" to-port="1" /> <edge from-layer="2726" from-port="2" to-layer="2735" to-port="0" /> <edge from-layer="2727" from-port="0" to-layer="2728" to-port="0" /> <edge from-layer="2728" from-port="1" to-layer="2731" to-port="0" /> <edge from-layer="2729" from-port="0" to-layer="2730" to-port="0" /> <edge from-layer="2730" from-port="1" to-layer="2731" to-port="1" /> <edge from-layer="2731" from-port="2" to-layer="2733" to-port="0" /> <edge from-layer="2732" from-port="0" to-layer="2733" to-port="1" /> <edge from-layer="2733" from-port="2" to-layer="2734" to-port="0" /> <edge from-layer="2734" from-port="1" to-layer="2735" to-port="1" /> <edge from-layer="2735" from-port="2" to-layer="2736" to-port="1" /> <edge from-layer="2736" from-port="2" to-layer="2740" to-port="0" /> <edge from-layer="2736" from-port="2" to-layer="2845" to-port="0" /> <edge from-layer="2736" from-port="2" to-layer="2747" to-port="0" /> <edge from-layer="2737" from-port="0" to-layer="2748" to-port="0" /> <edge from-layer="2738" from-port="0" to-layer="2746" to-port="0" /> <edge from-layer="2739" from-port="0" to-layer="2740" to-port="1" /> <edge from-layer="2740" from-port="2" to-layer="2742" to-port="0" /> <edge from-layer="2741" from-port="0" to-layer="2742" to-port="1" /> <edge from-layer="2742" from-port="2" to-layer="2744" to-port="0" /> <edge from-layer="2743" from-port="0" to-layer="2744" to-port="1" /> <edge from-layer="2744" from-port="2" to-layer="2745" to-port="0" /> <edge from-layer="2745" from-port="1" to-layer="2746" to-port="1" /> <edge from-layer="2746" from-port="2" to-layer="2747" to-port="1" /> <edge from-layer="2747" from-port="2" to-layer="2748" to-port="1" /> <edge from-layer="2748" from-port="2" to-layer="2787" to-port="0" /> <edge from-layer="2748" from-port="2" to-layer="2822" to-port="0" /> <edge from-layer="2748" from-port="2" to-layer="2757" to-port="0" /> <edge from-layer="2749" from-port="0" to-layer="2750" to-port="0" /> <edge from-layer="2750" from-port="1" to-layer="2753" to-port="0" /> <edge from-layer="2751" from-port="0" to-layer="2752" to-port="0" /> <edge from-layer="2752" from-port="1" to-layer="2753" to-port="1" /> <edge from-layer="2753" from-port="2" to-layer="2755" to-port="0" /> <edge from-layer="2754" from-port="0" to-layer="2755" to-port="1" /> <edge from-layer="2755" from-port="2" to-layer="2756" to-port="0" /> <edge from-layer="2756" from-port="1" to-layer="2757" to-port="1" /> <edge from-layer="2757" from-port="2" to-layer="2759" to-port="0" /> <edge from-layer="2758" from-port="0" to-layer="2759" to-port="1" /> <edge from-layer="2759" from-port="2" to-layer="2761" to-port="0" /> <edge from-layer="2760" from-port="0" to-layer="2761" to-port="1" /> <edge from-layer="2761" from-port="2" to-layer="2762" to-port="0" /> <edge from-layer="2761" from-port="2" to-layer="2766" to-port="0" /> <edge from-layer="2761" from-port="2" to-layer="2772" to-port="0" /> <edge from-layer="2762" from-port="2" to-layer="2775" to-port="0" /> <edge from-layer="2763" from-port="0" to-layer="2766" to-port="1" /> <edge from-layer="2764" from-port="0" to-layer="2766" to-port="2" /> <edge from-layer="2765" from-port="0" to-layer="2766" to-port="3" /> <edge from-layer="2766" from-port="5" to-layer="2768" to-port="0" /> <edge from-layer="2767" from-port="0" to-layer="2768" to-port="1" /> <edge from-layer="2768" from-port="2" to-layer="2773" to-port="0" /> <edge from-layer="2769" from-port="0" to-layer="2772" to-port="1" /> <edge from-layer="2770" from-port="0" to-layer="2772" to-port="2" /> <edge from-layer="2771" from-port="0" to-layer="2772" to-port="3" /> <edge from-layer="2772" from-port="5" to-layer="2773" to-port="1" /> <edge from-layer="2773" from-port="2" to-layer="2774" to-port="0" /> <edge from-layer="2774" from-port="2" to-layer="2775" to-port="1" /> <edge from-layer="2775" from-port="2" to-layer="2832" to-port="0" /> <edge from-layer="2776" from-port="1" to-layer="2778" to-port="0" /> <edge from-layer="2777" from-port="0" to-layer="2778" to-port="2" /> <edge from-layer="2778" from-port="3" to-layer="2806" to-port="0" /> <edge from-layer="2779" from-port="0" to-layer="2780" to-port="0" /> <edge from-layer="2780" from-port="1" to-layer="2783" to-port="0" /> <edge from-layer="2781" from-port="0" to-layer="2782" to-port="0" /> <edge from-layer="2782" from-port="1" to-layer="2783" to-port="1" /> <edge from-layer="2783" from-port="2" to-layer="2785" to-port="0" /> <edge from-layer="2784" from-port="0" to-layer="2785" to-port="1" /> <edge from-layer="2785" from-port="2" to-layer="2786" to-port="0" /> <edge from-layer="2786" from-port="1" to-layer="2787" to-port="1" /> <edge from-layer="2787" from-port="2" to-layer="2789" to-port="0" /> <edge from-layer="2788" from-port="0" to-layer="2789" to-port="1" /> <edge from-layer="2789" from-port="2" to-layer="2791" to-port="0" /> <edge from-layer="2790" from-port="0" to-layer="2791" to-port="1" /> <edge from-layer="2791" from-port="2" to-layer="2802" to-port="0" /> <edge from-layer="2791" from-port="2" to-layer="2796" to-port="0" /> <edge from-layer="2791" from-port="2" to-layer="2792" to-port="0" /> <edge from-layer="2792" from-port="2" to-layer="2805" to-port="0" /> <edge from-layer="2793" from-port="0" to-layer="2796" to-port="1" /> <edge from-layer="2794" from-port="0" to-layer="2796" to-port="2" /> <edge from-layer="2795" from-port="0" to-layer="2796" to-port="3" /> <edge from-layer="2796" from-port="5" to-layer="2798" to-port="0" /> <edge from-layer="2797" from-port="0" to-layer="2798" to-port="1" /> <edge from-layer="2798" from-port="2" to-layer="2803" to-port="0" /> <edge from-layer="2799" from-port="0" to-layer="2802" to-port="1" /> <edge from-layer="2800" from-port="0" to-layer="2802" to-port="2" /> <edge from-layer="2801" from-port="0" to-layer="2802" to-port="3" /> <edge from-layer="2802" from-port="5" to-layer="2803" to-port="1" /> <edge from-layer="2803" from-port="2" to-layer="2804" to-port="0" /> <edge from-layer="2804" from-port="2" to-layer="2805" to-port="1" /> <edge from-layer="2805" from-port="2" to-layer="2806" to-port="1" /> <edge from-layer="2806" from-port="2" to-layer="6164" to-port="0" /> <edge from-layer="2806" from-port="2" to-layer="2807" to-port="0" /> <edge from-layer="2807" from-port="2" to-layer="2808" to-port="0" /> <edge from-layer="2808" from-port="2" to-layer="2810" to-port="0" /> <edge from-layer="2809" from-port="0" to-layer="2810" to-port="1" /> <edge from-layer="2810" from-port="2" to-layer="2832" to-port="1" /> <edge from-layer="2811" from-port="1" to-layer="2813" to-port="0" /> <edge from-layer="2812" from-port="0" to-layer="2813" to-port="2" /> <edge from-layer="2813" from-port="3" to-layer="2827" to-port="0" /> <edge from-layer="2814" from-port="0" to-layer="2815" to-port="0" /> <edge from-layer="2815" from-port="1" to-layer="2818" to-port="0" /> <edge from-layer="2816" from-port="0" to-layer="2817" to-port="0" /> <edge from-layer="2817" from-port="1" to-layer="2818" to-port="1" /> <edge from-layer="2818" from-port="2" to-layer="2820" to-port="0" /> <edge from-layer="2819" from-port="0" to-layer="2820" to-port="1" /> <edge from-layer="2820" from-port="2" to-layer="2821" to-port="0" /> <edge from-layer="2821" from-port="1" to-layer="2822" to-port="1" /> <edge from-layer="2822" from-port="2" to-layer="2824" to-port="0" /> <edge from-layer="2823" from-port="0" to-layer="2824" to-port="1" /> <edge from-layer="2824" from-port="2" to-layer="2826" to-port="0" /> <edge from-layer="2825" from-port="0" to-layer="2826" to-port="1" /> <edge from-layer="2826" from-port="2" to-layer="2827" to-port="1" /> <edge from-layer="2827" from-port="2" to-layer="6163" to-port="0" /> <edge from-layer="2827" from-port="2" to-layer="2828" to-port="0" /> <edge from-layer="2828" from-port="2" to-layer="2829" to-port="0" /> <edge from-layer="2829" from-port="2" to-layer="2831" to-port="0" /> <edge from-layer="2830" from-port="0" to-layer="2831" to-port="1" /> <edge from-layer="2831" from-port="2" to-layer="2832" to-port="2" /> <edge from-layer="2832" from-port="4" to-layer="2834" to-port="0" /> <edge from-layer="2833" from-port="0" to-layer="2834" to-port="1" /> <edge from-layer="2834" from-port="2" to-layer="2835" to-port="0" /> <edge from-layer="2835" from-port="2" to-layer="2844" to-port="0" /> <edge from-layer="2836" from-port="0" to-layer="2837" to-port="0" /> <edge from-layer="2837" from-port="1" to-layer="2840" to-port="0" /> <edge from-layer="2838" from-port="0" to-layer="2839" to-port="0" /> <edge from-layer="2839" from-port="1" to-layer="2840" to-port="1" /> <edge from-layer="2840" from-port="2" to-layer="2842" to-port="0" /> <edge from-layer="2841" from-port="0" to-layer="2842" to-port="1" /> <edge from-layer="2842" from-port="2" to-layer="2843" to-port="0" /> <edge from-layer="2843" from-port="1" to-layer="2844" to-port="1" /> <edge from-layer="2844" from-port="2" to-layer="2845" to-port="1" /> <edge from-layer="2845" from-port="2" to-layer="2849" to-port="0" /> <edge from-layer="2845" from-port="2" to-layer="2887" to-port="0" /> <edge from-layer="2845" from-port="2" to-layer="2856" to-port="0" /> <edge from-layer="2846" from-port="0" to-layer="2857" to-port="0" /> <edge from-layer="2847" from-port="0" to-layer="2855" to-port="0" /> <edge from-layer="2848" from-port="0" to-layer="2849" to-port="1" /> <edge from-layer="2849" from-port="2" to-layer="2851" to-port="0" /> <edge from-layer="2850" from-port="0" to-layer="2851" to-port="1" /> <edge from-layer="2851" from-port="2" to-layer="2853" to-port="0" /> <edge from-layer="2852" from-port="0" to-layer="2853" to-port="1" /> <edge from-layer="2853" from-port="2" to-layer="2854" to-port="0" /> <edge from-layer="2854" from-port="1" to-layer="2855" to-port="1" /> <edge from-layer="2855" from-port="2" to-layer="2856" to-port="1" /> <edge from-layer="2856" from-port="2" to-layer="2857" to-port="1" /> <edge from-layer="2857" from-port="2" to-layer="2876" to-port="0" /> <edge from-layer="2857" from-port="2" to-layer="2866" to-port="0" /> <edge from-layer="2858" from-port="0" to-layer="2859" to-port="0" /> <edge from-layer="2859" from-port="1" to-layer="2862" to-port="0" /> <edge from-layer="2860" from-port="0" to-layer="2861" to-port="0" /> <edge from-layer="2861" from-port="1" to-layer="2862" to-port="1" /> <edge from-layer="2862" from-port="2" to-layer="2864" to-port="0" /> <edge from-layer="2863" from-port="0" to-layer="2864" to-port="1" /> <edge from-layer="2864" from-port="2" to-layer="2865" to-port="0" /> <edge from-layer="2865" from-port="1" to-layer="2866" to-port="1" /> <edge from-layer="2866" from-port="2" to-layer="2867" to-port="0" /> <edge from-layer="2867" from-port="1" to-layer="2877" to-port="0" /> <edge from-layer="2868" from-port="0" to-layer="2869" to-port="0" /> <edge from-layer="2869" from-port="1" to-layer="2872" to-port="0" /> <edge from-layer="2870" from-port="0" to-layer="2871" to-port="0" /> <edge from-layer="2871" from-port="1" to-layer="2872" to-port="1" /> <edge from-layer="2872" from-port="2" to-layer="2874" to-port="0" /> <edge from-layer="2873" from-port="0" to-layer="2874" to-port="1" /> <edge from-layer="2874" from-port="2" to-layer="2875" to-port="0" /> <edge from-layer="2875" from-port="1" to-layer="2876" to-port="1" /> <edge from-layer="2876" from-port="2" to-layer="2877" to-port="1" /> <edge from-layer="2877" from-port="2" to-layer="2886" to-port="0" /> <edge from-layer="2878" from-port="0" to-layer="2879" to-port="0" /> <edge from-layer="2879" from-port="1" to-layer="2882" to-port="0" /> <edge from-layer="2880" from-port="0" to-layer="2881" to-port="0" /> <edge from-layer="2881" from-port="1" to-layer="2882" to-port="1" /> <edge from-layer="2882" from-port="2" to-layer="2884" to-port="0" /> <edge from-layer="2883" from-port="0" to-layer="2884" to-port="1" /> <edge from-layer="2884" from-port="2" to-layer="2885" to-port="0" /> <edge from-layer="2885" from-port="1" to-layer="2886" to-port="1" /> <edge from-layer="2886" from-port="2" to-layer="2887" to-port="1" /> <edge from-layer="2887" from-port="2" to-layer="2891" to-port="0" /> <edge from-layer="2887" from-port="2" to-layer="2898" to-port="0" /> <edge from-layer="2887" from-port="2" to-layer="2996" to-port="0" /> <edge from-layer="2888" from-port="0" to-layer="2899" to-port="0" /> <edge from-layer="2889" from-port="0" to-layer="2897" to-port="0" /> <edge from-layer="2890" from-port="0" to-layer="2891" to-port="1" /> <edge from-layer="2891" from-port="2" to-layer="2893" to-port="0" /> <edge from-layer="2892" from-port="0" to-layer="2893" to-port="1" /> <edge from-layer="2893" from-port="2" to-layer="2895" to-port="0" /> <edge from-layer="2894" from-port="0" to-layer="2895" to-port="1" /> <edge from-layer="2895" from-port="2" to-layer="2896" to-port="0" /> <edge from-layer="2896" from-port="1" to-layer="2897" to-port="1" /> <edge from-layer="2897" from-port="2" to-layer="2898" to-port="1" /> <edge from-layer="2898" from-port="2" to-layer="2899" to-port="1" /> <edge from-layer="2899" from-port="2" to-layer="2938" to-port="0" /> <edge from-layer="2899" from-port="2" to-layer="2973" to-port="0" /> <edge from-layer="2899" from-port="2" to-layer="2908" to-port="0" /> <edge from-layer="2900" from-port="0" to-layer="2901" to-port="0" /> <edge from-layer="2901" from-port="1" to-layer="2904" to-port="0" /> <edge from-layer="2902" from-port="0" to-layer="2903" to-port="0" /> <edge from-layer="2903" from-port="1" to-layer="2904" to-port="1" /> <edge from-layer="2904" from-port="2" to-layer="2906" to-port="0" /> <edge from-layer="2905" from-port="0" to-layer="2906" to-port="1" /> <edge from-layer="2906" from-port="2" to-layer="2907" to-port="0" /> <edge from-layer="2907" from-port="1" to-layer="2908" to-port="1" /> <edge from-layer="2908" from-port="2" to-layer="2910" to-port="0" /> <edge from-layer="2909" from-port="0" to-layer="2910" to-port="1" /> <edge from-layer="2910" from-port="2" to-layer="2912" to-port="0" /> <edge from-layer="2911" from-port="0" to-layer="2912" to-port="1" /> <edge from-layer="2912" from-port="2" to-layer="2913" to-port="0" /> <edge from-layer="2912" from-port="2" to-layer="2917" to-port="0" /> <edge from-layer="2912" from-port="2" to-layer="2923" to-port="0" /> <edge from-layer="2913" from-port="2" to-layer="2926" to-port="0" /> <edge from-layer="2914" from-port="0" to-layer="2917" to-port="1" /> <edge from-layer="2915" from-port="0" to-layer="2917" to-port="2" /> <edge from-layer="2916" from-port="0" to-layer="2917" to-port="3" /> <edge from-layer="2917" from-port="5" to-layer="2919" to-port="0" /> <edge from-layer="2918" from-port="0" to-layer="2919" to-port="1" /> <edge from-layer="2919" from-port="2" to-layer="2924" to-port="0" /> <edge from-layer="2920" from-port="0" to-layer="2923" to-port="1" /> <edge from-layer="2921" from-port="0" to-layer="2923" to-port="2" /> <edge from-layer="2922" from-port="0" to-layer="2923" to-port="3" /> <edge from-layer="2923" from-port="5" to-layer="2924" to-port="1" /> <edge from-layer="2924" from-port="2" to-layer="2925" to-port="0" /> <edge from-layer="2925" from-port="2" to-layer="2926" to-port="1" /> <edge from-layer="2926" from-port="2" to-layer="2983" to-port="0" /> <edge from-layer="2927" from-port="1" to-layer="2929" to-port="0" /> <edge from-layer="2928" from-port="0" to-layer="2929" to-port="2" /> <edge from-layer="2929" from-port="3" to-layer="2957" to-port="0" /> <edge from-layer="2930" from-port="0" to-layer="2931" to-port="0" /> <edge from-layer="2931" from-port="1" to-layer="2934" to-port="0" /> <edge from-layer="2932" from-port="0" to-layer="2933" to-port="0" /> <edge from-layer="2933" from-port="1" to-layer="2934" to-port="1" /> <edge from-layer="2934" from-port="2" to-layer="2936" to-port="0" /> <edge from-layer="2935" from-port="0" to-layer="2936" to-port="1" /> <edge from-layer="2936" from-port="2" to-layer="2937" to-port="0" /> <edge from-layer="2937" from-port="1" to-layer="2938" to-port="1" /> <edge from-layer="2938" from-port="2" to-layer="2940" to-port="0" /> <edge from-layer="2939" from-port="0" to-layer="2940" to-port="1" /> <edge from-layer="2940" from-port="2" to-layer="2942" to-port="0" /> <edge from-layer="2941" from-port="0" to-layer="2942" to-port="1" /> <edge from-layer="2942" from-port="2" to-layer="2953" to-port="0" /> <edge from-layer="2942" from-port="2" to-layer="2943" to-port="0" /> <edge from-layer="2942" from-port="2" to-layer="2947" to-port="0" /> <edge from-layer="2943" from-port="2" to-layer="2956" to-port="0" /> <edge from-layer="2944" from-port="0" to-layer="2947" to-port="1" /> <edge from-layer="2945" from-port="0" to-layer="2947" to-port="2" /> <edge from-layer="2946" from-port="0" to-layer="2947" to-port="3" /> <edge from-layer="2947" from-port="5" to-layer="2949" to-port="0" /> <edge from-layer="2948" from-port="0" to-layer="2949" to-port="1" /> <edge from-layer="2949" from-port="2" to-layer="2954" to-port="0" /> <edge from-layer="2950" from-port="0" to-layer="2953" to-port="1" /> <edge from-layer="2951" from-port="0" to-layer="2953" to-port="2" /> <edge from-layer="2952" from-port="0" to-layer="2953" to-port="3" /> <edge from-layer="2953" from-port="5" to-layer="2954" to-port="1" /> <edge from-layer="2954" from-port="2" to-layer="2955" to-port="0" /> <edge from-layer="2955" from-port="2" to-layer="2956" to-port="1" /> <edge from-layer="2956" from-port="2" to-layer="2957" to-port="1" /> <edge from-layer="2957" from-port="2" to-layer="6162" to-port="0" /> <edge from-layer="2957" from-port="2" to-layer="2958" to-port="0" /> <edge from-layer="2958" from-port="2" to-layer="2959" to-port="0" /> <edge from-layer="2959" from-port="2" to-layer="2961" to-port="0" /> <edge from-layer="2960" from-port="0" to-layer="2961" to-port="1" /> <edge from-layer="2961" from-port="2" to-layer="2983" to-port="1" /> <edge from-layer="2962" from-port="1" to-layer="2964" to-port="0" /> <edge from-layer="2963" from-port="0" to-layer="2964" to-port="2" /> <edge from-layer="2964" from-port="3" to-layer="2978" to-port="0" /> <edge from-layer="2965" from-port="0" to-layer="2966" to-port="0" /> <edge from-layer="2966" from-port="1" to-layer="2969" to-port="0" /> <edge from-layer="2967" from-port="0" to-layer="2968" to-port="0" /> <edge from-layer="2968" from-port="1" to-layer="2969" to-port="1" /> <edge from-layer="2969" from-port="2" to-layer="2971" to-port="0" /> <edge from-layer="2970" from-port="0" to-layer="2971" to-port="1" /> <edge from-layer="2971" from-port="2" to-layer="2972" to-port="0" /> <edge from-layer="2972" from-port="1" to-layer="2973" to-port="1" /> <edge from-layer="2973" from-port="2" to-layer="2975" to-port="0" /> <edge from-layer="2974" from-port="0" to-layer="2975" to-port="1" /> <edge from-layer="2975" from-port="2" to-layer="2977" to-port="0" /> <edge from-layer="2976" from-port="0" to-layer="2977" to-port="1" /> <edge from-layer="2977" from-port="2" to-layer="2978" to-port="1" /> <edge from-layer="2978" from-port="2" to-layer="2979" to-port="0" /> <edge from-layer="2978" from-port="2" to-layer="6161" to-port="0" /> <edge from-layer="2979" from-port="2" to-layer="2980" to-port="0" /> <edge from-layer="2980" from-port="2" to-layer="2982" to-port="0" /> <edge from-layer="2981" from-port="0" to-layer="2982" to-port="1" /> <edge from-layer="2982" from-port="2" to-layer="2983" to-port="2" /> <edge from-layer="2983" from-port="4" to-layer="2985" to-port="0" /> <edge from-layer="2984" from-port="0" to-layer="2985" to-port="1" /> <edge from-layer="2985" from-port="2" to-layer="2986" to-port="0" /> <edge from-layer="2986" from-port="2" to-layer="2995" to-port="0" /> <edge from-layer="2987" from-port="0" to-layer="2988" to-port="0" /> <edge from-layer="2988" from-port="1" to-layer="2991" to-port="0" /> <edge from-layer="2989" from-port="0" to-layer="2990" to-port="0" /> <edge from-layer="2990" from-port="1" to-layer="2991" to-port="1" /> <edge from-layer="2991" from-port="2" to-layer="2993" to-port="0" /> <edge from-layer="2992" from-port="0" to-layer="2993" to-port="1" /> <edge from-layer="2993" from-port="2" to-layer="2994" to-port="0" /> <edge from-layer="2994" from-port="1" to-layer="2995" to-port="1" /> <edge from-layer="2995" from-port="2" to-layer="2996" to-port="1" /> <edge from-layer="2996" from-port="2" to-layer="3000" to-port="0" /> <edge from-layer="2996" from-port="2" to-layer="3007" to-port="0" /> <edge from-layer="2996" from-port="2" to-layer="3038" to-port="0" /> <edge from-layer="2997" from-port="0" to-layer="3008" to-port="0" /> <edge from-layer="2998" from-port="0" to-layer="3006" to-port="0" /> <edge from-layer="2999" from-port="0" to-layer="3000" to-port="1" /> <edge from-layer="3000" from-port="2" to-layer="3002" to-port="0" /> <edge from-layer="3001" from-port="0" to-layer="3002" to-port="1" /> <edge from-layer="3002" from-port="2" to-layer="3004" to-port="0" /> <edge from-layer="3003" from-port="0" to-layer="3004" to-port="1" /> <edge from-layer="3004" from-port="2" to-layer="3005" to-port="0" /> <edge from-layer="3005" from-port="1" to-layer="3006" to-port="1" /> <edge from-layer="3006" from-port="2" to-layer="3007" to-port="1" /> <edge from-layer="3007" from-port="2" to-layer="3008" to-port="1" /> <edge from-layer="3008" from-port="2" to-layer="3017" to-port="0" /> <edge from-layer="3008" from-port="2" to-layer="3027" to-port="0" /> <edge from-layer="3009" from-port="0" to-layer="3010" to-port="0" /> <edge from-layer="3010" from-port="1" to-layer="3013" to-port="0" /> <edge from-layer="3011" from-port="0" to-layer="3012" to-port="0" /> <edge from-layer="3012" from-port="1" to-layer="3013" to-port="1" /> <edge from-layer="3013" from-port="2" to-layer="3015" to-port="0" /> <edge from-layer="3014" from-port="0" to-layer="3015" to-port="1" /> <edge from-layer="3015" from-port="2" to-layer="3016" to-port="0" /> <edge from-layer="3016" from-port="1" to-layer="3017" to-port="1" /> <edge from-layer="3017" from-port="2" to-layer="3018" to-port="0" /> <edge from-layer="3018" from-port="1" to-layer="3028" to-port="0" /> <edge from-layer="3019" from-port="0" to-layer="3020" to-port="0" /> <edge from-layer="3020" from-port="1" to-layer="3023" to-port="0" /> <edge from-layer="3021" from-port="0" to-layer="3022" to-port="0" /> <edge from-layer="3022" from-port="1" to-layer="3023" to-port="1" /> <edge from-layer="3023" from-port="2" to-layer="3025" to-port="0" /> <edge from-layer="3024" from-port="0" to-layer="3025" to-port="1" /> <edge from-layer="3025" from-port="2" to-layer="3026" to-port="0" /> <edge from-layer="3026" from-port="1" to-layer="3027" to-port="1" /> <edge from-layer="3027" from-port="2" to-layer="3028" to-port="1" /> <edge from-layer="3028" from-port="2" to-layer="3037" to-port="0" /> <edge from-layer="3029" from-port="0" to-layer="3030" to-port="0" /> <edge from-layer="3030" from-port="1" to-layer="3033" to-port="0" /> <edge from-layer="3031" from-port="0" to-layer="3032" to-port="0" /> <edge from-layer="3032" from-port="1" to-layer="3033" to-port="1" /> <edge from-layer="3033" from-port="2" to-layer="3035" to-port="0" /> <edge from-layer="3034" from-port="0" to-layer="3035" to-port="1" /> <edge from-layer="3035" from-port="2" to-layer="3036" to-port="0" /> <edge from-layer="3036" from-port="1" to-layer="3037" to-port="1" /> <edge from-layer="3037" from-port="2" to-layer="3038" to-port="1" /> <edge from-layer="3038" from-port="2" to-layer="3147" to-port="0" /> <edge from-layer="3038" from-port="2" to-layer="3049" to-port="0" /> <edge from-layer="3038" from-port="2" to-layer="3042" to-port="0" /> <edge from-layer="3039" from-port="0" to-layer="3050" to-port="0" /> <edge from-layer="3040" from-port="0" to-layer="3048" to-port="0" /> <edge from-layer="3041" from-port="0" to-layer="3042" to-port="1" /> <edge from-layer="3042" from-port="2" to-layer="3044" to-port="0" /> <edge from-layer="3043" from-port="0" to-layer="3044" to-port="1" /> <edge from-layer="3044" from-port="2" to-layer="3046" to-port="0" /> <edge from-layer="3045" from-port="0" to-layer="3046" to-port="1" /> <edge from-layer="3046" from-port="2" to-layer="3047" to-port="0" /> <edge from-layer="3047" from-port="1" to-layer="3048" to-port="1" /> <edge from-layer="3048" from-port="2" to-layer="3049" to-port="1" /> <edge from-layer="3049" from-port="2" to-layer="3050" to-port="1" /> <edge from-layer="3050" from-port="2" to-layer="3089" to-port="0" /> <edge from-layer="3050" from-port="2" to-layer="3059" to-port="0" /> <edge from-layer="3050" from-port="2" to-layer="3124" to-port="0" /> <edge from-layer="3051" from-port="0" to-layer="3052" to-port="0" /> <edge from-layer="3052" from-port="1" to-layer="3055" to-port="0" /> <edge from-layer="3053" from-port="0" to-layer="3054" to-port="0" /> <edge from-layer="3054" from-port="1" to-layer="3055" to-port="1" /> <edge from-layer="3055" from-port="2" to-layer="3057" to-port="0" /> <edge from-layer="3056" from-port="0" to-layer="3057" to-port="1" /> <edge from-layer="3057" from-port="2" to-layer="3058" to-port="0" /> <edge from-layer="3058" from-port="1" to-layer="3059" to-port="1" /> <edge from-layer="3059" from-port="2" to-layer="3061" to-port="0" /> <edge from-layer="3060" from-port="0" to-layer="3061" to-port="1" /> <edge from-layer="3061" from-port="2" to-layer="3063" to-port="0" /> <edge from-layer="3062" from-port="0" to-layer="3063" to-port="1" /> <edge from-layer="3063" from-port="2" to-layer="3064" to-port="0" /> <edge from-layer="3063" from-port="2" to-layer="3068" to-port="0" /> <edge from-layer="3063" from-port="2" to-layer="3074" to-port="0" /> <edge from-layer="3064" from-port="2" to-layer="3077" to-port="0" /> <edge from-layer="3065" from-port="0" to-layer="3068" to-port="1" /> <edge from-layer="3066" from-port="0" to-layer="3068" to-port="2" /> <edge from-layer="3067" from-port="0" to-layer="3068" to-port="3" /> <edge from-layer="3068" from-port="5" to-layer="3070" to-port="0" /> <edge from-layer="3069" from-port="0" to-layer="3070" to-port="1" /> <edge from-layer="3070" from-port="2" to-layer="3075" to-port="0" /> <edge from-layer="3071" from-port="0" to-layer="3074" to-port="1" /> <edge from-layer="3072" from-port="0" to-layer="3074" to-port="2" /> <edge from-layer="3073" from-port="0" to-layer="3074" to-port="3" /> <edge from-layer="3074" from-port="5" to-layer="3075" to-port="1" /> <edge from-layer="3075" from-port="2" to-layer="3076" to-port="0" /> <edge from-layer="3076" from-port="2" to-layer="3077" to-port="1" /> <edge from-layer="3077" from-port="2" to-layer="3134" to-port="0" /> <edge from-layer="3078" from-port="1" to-layer="3080" to-port="0" /> <edge from-layer="3079" from-port="0" to-layer="3080" to-port="2" /> <edge from-layer="3080" from-port="3" to-layer="3108" to-port="0" /> <edge from-layer="3081" from-port="0" to-layer="3082" to-port="0" /> <edge from-layer="3082" from-port="1" to-layer="3085" to-port="0" /> <edge from-layer="3083" from-port="0" to-layer="3084" to-port="0" /> <edge from-layer="3084" from-port="1" to-layer="3085" to-port="1" /> <edge from-layer="3085" from-port="2" to-layer="3087" to-port="0" /> <edge from-layer="3086" from-port="0" to-layer="3087" to-port="1" /> <edge from-layer="3087" from-port="2" to-layer="3088" to-port="0" /> <edge from-layer="3088" from-port="1" to-layer="3089" to-port="1" /> <edge from-layer="3089" from-port="2" to-layer="3091" to-port="0" /> <edge from-layer="3090" from-port="0" to-layer="3091" to-port="1" /> <edge from-layer="3091" from-port="2" to-layer="3093" to-port="0" /> <edge from-layer="3092" from-port="0" to-layer="3093" to-port="1" /> <edge from-layer="3093" from-port="2" to-layer="3094" to-port="0" /> <edge from-layer="3093" from-port="2" to-layer="3098" to-port="0" /> <edge from-layer="3093" from-port="2" to-layer="3104" to-port="0" /> <edge from-layer="3094" from-port="2" to-layer="3107" to-port="0" /> <edge from-layer="3095" from-port="0" to-layer="3098" to-port="1" /> <edge from-layer="3096" from-port="0" to-layer="3098" to-port="2" /> <edge from-layer="3097" from-port="0" to-layer="3098" to-port="3" /> <edge from-layer="3098" from-port="5" to-layer="3100" to-port="0" /> <edge from-layer="3099" from-port="0" to-layer="3100" to-port="1" /> <edge from-layer="3100" from-port="2" to-layer="3105" to-port="0" /> <edge from-layer="3101" from-port="0" to-layer="3104" to-port="1" /> <edge from-layer="3102" from-port="0" to-layer="3104" to-port="2" /> <edge from-layer="3103" from-port="0" to-layer="3104" to-port="3" /> <edge from-layer="3104" from-port="5" to-layer="3105" to-port="1" /> <edge from-layer="3105" from-port="2" to-layer="3106" to-port="0" /> <edge from-layer="3106" from-port="2" to-layer="3107" to-port="1" /> <edge from-layer="3107" from-port="2" to-layer="3108" to-port="1" /> <edge from-layer="3108" from-port="2" to-layer="6160" to-port="0" /> <edge from-layer="3108" from-port="2" to-layer="3109" to-port="0" /> <edge from-layer="3109" from-port="2" to-layer="3110" to-port="0" /> <edge from-layer="3110" from-port="2" to-layer="3112" to-port="0" /> <edge from-layer="3111" from-port="0" to-layer="3112" to-port="1" /> <edge from-layer="3112" from-port="2" to-layer="3134" to-port="1" /> <edge from-layer="3113" from-port="1" to-layer="3115" to-port="0" /> <edge from-layer="3114" from-port="0" to-layer="3115" to-port="2" /> <edge from-layer="3115" from-port="3" to-layer="3129" to-port="0" /> <edge from-layer="3116" from-port="0" to-layer="3117" to-port="0" /> <edge from-layer="3117" from-port="1" to-layer="3120" to-port="0" /> <edge from-layer="3118" from-port="0" to-layer="3119" to-port="0" /> <edge from-layer="3119" from-port="1" to-layer="3120" to-port="1" /> <edge from-layer="3120" from-port="2" to-layer="3122" to-port="0" /> <edge from-layer="3121" from-port="0" to-layer="3122" to-port="1" /> <edge from-layer="3122" from-port="2" to-layer="3123" to-port="0" /> <edge from-layer="3123" from-port="1" to-layer="3124" to-port="1" /> <edge from-layer="3124" from-port="2" to-layer="3126" to-port="0" /> <edge from-layer="3125" from-port="0" to-layer="3126" to-port="1" /> <edge from-layer="3126" from-port="2" to-layer="3128" to-port="0" /> <edge from-layer="3127" from-port="0" to-layer="3128" to-port="1" /> <edge from-layer="3128" from-port="2" to-layer="3129" to-port="1" /> <edge from-layer="3129" from-port="2" to-layer="3130" to-port="0" /> <edge from-layer="3129" from-port="2" to-layer="6159" to-port="0" /> <edge from-layer="3130" from-port="2" to-layer="3131" to-port="0" /> <edge from-layer="3131" from-port="2" to-layer="3133" to-port="0" /> <edge from-layer="3132" from-port="0" to-layer="3133" to-port="1" /> <edge from-layer="3133" from-port="2" to-layer="3134" to-port="2" /> <edge from-layer="3134" from-port="4" to-layer="3136" to-port="0" /> <edge from-layer="3135" from-port="0" to-layer="3136" to-port="1" /> <edge from-layer="3136" from-port="2" to-layer="3137" to-port="0" /> <edge from-layer="3137" from-port="2" to-layer="3146" to-port="0" /> <edge from-layer="3138" from-port="0" to-layer="3139" to-port="0" /> <edge from-layer="3139" from-port="1" to-layer="3142" to-port="0" /> <edge from-layer="3140" from-port="0" to-layer="3141" to-port="0" /> <edge from-layer="3141" from-port="1" to-layer="3142" to-port="1" /> <edge from-layer="3142" from-port="2" to-layer="3144" to-port="0" /> <edge from-layer="3143" from-port="0" to-layer="3144" to-port="1" /> <edge from-layer="3144" from-port="2" to-layer="3145" to-port="0" /> <edge from-layer="3145" from-port="1" to-layer="3146" to-port="1" /> <edge from-layer="3146" from-port="2" to-layer="3147" to-port="1" /> <edge from-layer="3147" from-port="2" to-layer="3151" to-port="0" /> <edge from-layer="3147" from-port="2" to-layer="3158" to-port="0" /> <edge from-layer="3147" from-port="2" to-layer="3189" to-port="0" /> <edge from-layer="3148" from-port="0" to-layer="3159" to-port="0" /> <edge from-layer="3149" from-port="0" to-layer="3157" to-port="0" /> <edge from-layer="3150" from-port="0" to-layer="3151" to-port="1" /> <edge from-layer="3151" from-port="2" to-layer="3153" to-port="0" /> <edge from-layer="3152" from-port="0" to-layer="3153" to-port="1" /> <edge from-layer="3153" from-port="2" to-layer="3155" to-port="0" /> <edge from-layer="3154" from-port="0" to-layer="3155" to-port="1" /> <edge from-layer="3155" from-port="2" to-layer="3156" to-port="0" /> <edge from-layer="3156" from-port="1" to-layer="3157" to-port="1" /> <edge from-layer="3157" from-port="2" to-layer="3158" to-port="1" /> <edge from-layer="3158" from-port="2" to-layer="3159" to-port="1" /> <edge from-layer="3159" from-port="2" to-layer="3178" to-port="0" /> <edge from-layer="3159" from-port="2" to-layer="3168" to-port="0" /> <edge from-layer="3160" from-port="0" to-layer="3161" to-port="0" /> <edge from-layer="3161" from-port="1" to-layer="3164" to-port="0" /> <edge from-layer="3162" from-port="0" to-layer="3163" to-port="0" /> <edge from-layer="3163" from-port="1" to-layer="3164" to-port="1" /> <edge from-layer="3164" from-port="2" to-layer="3166" to-port="0" /> <edge from-layer="3165" from-port="0" to-layer="3166" to-port="1" /> <edge from-layer="3166" from-port="2" to-layer="3167" to-port="0" /> <edge from-layer="3167" from-port="1" to-layer="3168" to-port="1" /> <edge from-layer="3168" from-port="2" to-layer="3169" to-port="0" /> <edge from-layer="3169" from-port="1" to-layer="3179" to-port="0" /> <edge from-layer="3170" from-port="0" to-layer="3171" to-port="0" /> <edge from-layer="3171" from-port="1" to-layer="3174" to-port="0" /> <edge from-layer="3172" from-port="0" to-layer="3173" to-port="0" /> <edge from-layer="3173" from-port="1" to-layer="3174" to-port="1" /> <edge from-layer="3174" from-port="2" to-layer="3176" to-port="0" /> <edge from-layer="3175" from-port="0" to-layer="3176" to-port="1" /> <edge from-layer="3176" from-port="2" to-layer="3177" to-port="0" /> <edge from-layer="3177" from-port="1" to-layer="3178" to-port="1" /> <edge from-layer="3178" from-port="2" to-layer="3179" to-port="1" /> <edge from-layer="3179" from-port="2" to-layer="3188" to-port="0" /> <edge from-layer="3180" from-port="0" to-layer="3181" to-port="0" /> <edge from-layer="3181" from-port="1" to-layer="3184" to-port="0" /> <edge from-layer="3182" from-port="0" to-layer="3183" to-port="0" /> <edge from-layer="3183" from-port="1" to-layer="3184" to-port="1" /> <edge from-layer="3184" from-port="2" to-layer="3186" to-port="0" /> <edge from-layer="3185" from-port="0" to-layer="3186" to-port="1" /> <edge from-layer="3186" from-port="2" to-layer="3187" to-port="0" /> <edge from-layer="3187" from-port="1" to-layer="3188" to-port="1" /> <edge from-layer="3188" from-port="2" to-layer="3189" to-port="1" /> <edge from-layer="3189" from-port="2" to-layer="3193" to-port="0" /> <edge from-layer="3189" from-port="2" to-layer="3200" to-port="0" /> <edge from-layer="3189" from-port="2" to-layer="3298" to-port="0" /> <edge from-layer="3190" from-port="0" to-layer="3201" to-port="0" /> <edge from-layer="3191" from-port="0" to-layer="3199" to-port="0" /> <edge from-layer="3192" from-port="0" to-layer="3193" to-port="1" /> <edge from-layer="3193" from-port="2" to-layer="3195" to-port="0" /> <edge from-layer="3194" from-port="0" to-layer="3195" to-port="1" /> <edge from-layer="3195" from-port="2" to-layer="3197" to-port="0" /> <edge from-layer="3196" from-port="0" to-layer="3197" to-port="1" /> <edge from-layer="3197" from-port="2" to-layer="3198" to-port="0" /> <edge from-layer="3198" from-port="1" to-layer="3199" to-port="1" /> <edge from-layer="3199" from-port="2" to-layer="3200" to-port="1" /> <edge from-layer="3200" from-port="2" to-layer="3201" to-port="1" /> <edge from-layer="3201" from-port="2" to-layer="3210" to-port="0" /> <edge from-layer="3201" from-port="2" to-layer="3240" to-port="0" /> <edge from-layer="3201" from-port="2" to-layer="3275" to-port="0" /> <edge from-layer="3202" from-port="0" to-layer="3203" to-port="0" /> <edge from-layer="3203" from-port="1" to-layer="3206" to-port="0" /> <edge from-layer="3204" from-port="0" to-layer="3205" to-port="0" /> <edge from-layer="3205" from-port="1" to-layer="3206" to-port="1" /> <edge from-layer="3206" from-port="2" to-layer="3208" to-port="0" /> <edge from-layer="3207" from-port="0" to-layer="3208" to-port="1" /> <edge from-layer="3208" from-port="2" to-layer="3209" to-port="0" /> <edge from-layer="3209" from-port="1" to-layer="3210" to-port="1" /> <edge from-layer="3210" from-port="2" to-layer="3212" to-port="0" /> <edge from-layer="3211" from-port="0" to-layer="3212" to-port="1" /> <edge from-layer="3212" from-port="2" to-layer="3214" to-port="0" /> <edge from-layer="3213" from-port="0" to-layer="3214" to-port="1" /> <edge from-layer="3214" from-port="2" to-layer="3215" to-port="0" /> <edge from-layer="3214" from-port="2" to-layer="3219" to-port="0" /> <edge from-layer="3214" from-port="2" to-layer="3225" to-port="0" /> <edge from-layer="3215" from-port="2" to-layer="3228" to-port="0" /> <edge from-layer="3216" from-port="0" to-layer="3219" to-port="1" /> <edge from-layer="3217" from-port="0" to-layer="3219" to-port="2" /> <edge from-layer="3218" from-port="0" to-layer="3219" to-port="3" /> <edge from-layer="3219" from-port="5" to-layer="3221" to-port="0" /> <edge from-layer="3220" from-port="0" to-layer="3221" to-port="1" /> <edge from-layer="3221" from-port="2" to-layer="3226" to-port="0" /> <edge from-layer="3222" from-port="0" to-layer="3225" to-port="1" /> <edge from-layer="3223" from-port="0" to-layer="3225" to-port="2" /> <edge from-layer="3224" from-port="0" to-layer="3225" to-port="3" /> <edge from-layer="3225" from-port="5" to-layer="3226" to-port="1" /> <edge from-layer="3226" from-port="2" to-layer="3227" to-port="0" /> <edge from-layer="3227" from-port="2" to-layer="3228" to-port="1" /> <edge from-layer="3228" from-port="2" to-layer="3285" to-port="0" /> <edge from-layer="3229" from-port="1" to-layer="3231" to-port="0" /> <edge from-layer="3230" from-port="0" to-layer="3231" to-port="2" /> <edge from-layer="3231" from-port="3" to-layer="3259" to-port="0" /> <edge from-layer="3232" from-port="0" to-layer="3233" to-port="0" /> <edge from-layer="3233" from-port="1" to-layer="3236" to-port="0" /> <edge from-layer="3234" from-port="0" to-layer="3235" to-port="0" /> <edge from-layer="3235" from-port="1" to-layer="3236" to-port="1" /> <edge from-layer="3236" from-port="2" to-layer="3238" to-port="0" /> <edge from-layer="3237" from-port="0" to-layer="3238" to-port="1" /> <edge from-layer="3238" from-port="2" to-layer="3239" to-port="0" /> <edge from-layer="3239" from-port="1" to-layer="3240" to-port="1" /> <edge from-layer="3240" from-port="2" to-layer="3242" to-port="0" /> <edge from-layer="3241" from-port="0" to-layer="3242" to-port="1" /> <edge from-layer="3242" from-port="2" to-layer="3244" to-port="0" /> <edge from-layer="3243" from-port="0" to-layer="3244" to-port="1" /> <edge from-layer="3244" from-port="2" to-layer="3245" to-port="0" /> <edge from-layer="3244" from-port="2" to-layer="3249" to-port="0" /> <edge from-layer="3244" from-port="2" to-layer="3255" to-port="0" /> <edge from-layer="3245" from-port="2" to-layer="3258" to-port="0" /> <edge from-layer="3246" from-port="0" to-layer="3249" to-port="1" /> <edge from-layer="3247" from-port="0" to-layer="3249" to-port="2" /> <edge from-layer="3248" from-port="0" to-layer="3249" to-port="3" /> <edge from-layer="3249" from-port="5" to-layer="3251" to-port="0" /> <edge from-layer="3250" from-port="0" to-layer="3251" to-port="1" /> <edge from-layer="3251" from-port="2" to-layer="3256" to-port="0" /> <edge from-layer="3252" from-port="0" to-layer="3255" to-port="1" /> <edge from-layer="3253" from-port="0" to-layer="3255" to-port="2" /> <edge from-layer="3254" from-port="0" to-layer="3255" to-port="3" /> <edge from-layer="3255" from-port="5" to-layer="3256" to-port="1" /> <edge from-layer="3256" from-port="2" to-layer="3257" to-port="0" /> <edge from-layer="3257" from-port="2" to-layer="3258" to-port="1" /> <edge from-layer="3258" from-port="2" to-layer="3259" to-port="1" /> <edge from-layer="3259" from-port="2" to-layer="6156" to-port="0" /> <edge from-layer="3259" from-port="2" to-layer="3260" to-port="0" /> <edge from-layer="3260" from-port="2" to-layer="3261" to-port="0" /> <edge from-layer="3261" from-port="2" to-layer="3263" to-port="0" /> <edge from-layer="3262" from-port="0" to-layer="3263" to-port="1" /> <edge from-layer="3263" from-port="2" to-layer="3285" to-port="1" /> <edge from-layer="3264" from-port="1" to-layer="3266" to-port="0" /> <edge from-layer="3265" from-port="0" to-layer="3266" to-port="2" /> <edge from-layer="3266" from-port="3" to-layer="3280" to-port="0" /> <edge from-layer="3267" from-port="0" to-layer="3268" to-port="0" /> <edge from-layer="3268" from-port="1" to-layer="3271" to-port="0" /> <edge from-layer="3269" from-port="0" to-layer="3270" to-port="0" /> <edge from-layer="3270" from-port="1" to-layer="3271" to-port="1" /> <edge from-layer="3271" from-port="2" to-layer="3273" to-port="0" /> <edge from-layer="3272" from-port="0" to-layer="3273" to-port="1" /> <edge from-layer="3273" from-port="2" to-layer="3274" to-port="0" /> <edge from-layer="3274" from-port="1" to-layer="3275" to-port="1" /> <edge from-layer="3275" from-port="2" to-layer="3277" to-port="0" /> <edge from-layer="3276" from-port="0" to-layer="3277" to-port="1" /> <edge from-layer="3277" from-port="2" to-layer="3279" to-port="0" /> <edge from-layer="3278" from-port="0" to-layer="3279" to-port="1" /> <edge from-layer="3279" from-port="2" to-layer="3280" to-port="1" /> <edge from-layer="3280" from-port="2" to-layer="3281" to-port="0" /> <edge from-layer="3280" from-port="2" to-layer="6155" to-port="0" /> <edge from-layer="3281" from-port="2" to-layer="3282" to-port="0" /> <edge from-layer="3282" from-port="2" to-layer="3284" to-port="0" /> <edge from-layer="3283" from-port="0" to-layer="3284" to-port="1" /> <edge from-layer="3284" from-port="2" to-layer="3285" to-port="2" /> <edge from-layer="3285" from-port="4" to-layer="3287" to-port="0" /> <edge from-layer="3286" from-port="0" to-layer="3287" to-port="1" /> <edge from-layer="3287" from-port="2" to-layer="3288" to-port="0" /> <edge from-layer="3288" from-port="2" to-layer="3297" to-port="0" /> <edge from-layer="3289" from-port="0" to-layer="3290" to-port="0" /> <edge from-layer="3290" from-port="1" to-layer="3293" to-port="0" /> <edge from-layer="3291" from-port="0" to-layer="3292" to-port="0" /> <edge from-layer="3292" from-port="1" to-layer="3293" to-port="1" /> <edge from-layer="3293" from-port="2" to-layer="3295" to-port="0" /> <edge from-layer="3294" from-port="0" to-layer="3295" to-port="1" /> <edge from-layer="3295" from-port="2" to-layer="3296" to-port="0" /> <edge from-layer="3296" from-port="1" to-layer="3297" to-port="1" /> <edge from-layer="3297" from-port="2" to-layer="3298" to-port="1" /> <edge from-layer="3298" from-port="2" to-layer="3340" to-port="0" /> <edge from-layer="3298" from-port="2" to-layer="3309" to-port="0" /> <edge from-layer="3298" from-port="2" to-layer="3302" to-port="0" /> <edge from-layer="3299" from-port="0" to-layer="3310" to-port="0" /> <edge from-layer="3300" from-port="0" to-layer="3308" to-port="0" /> <edge from-layer="3301" from-port="0" to-layer="3302" to-port="1" /> <edge from-layer="3302" from-port="2" to-layer="3304" to-port="0" /> <edge from-layer="3303" from-port="0" to-layer="3304" to-port="1" /> <edge from-layer="3304" from-port="2" to-layer="3306" to-port="0" /> <edge from-layer="3305" from-port="0" to-layer="3306" to-port="1" /> <edge from-layer="3306" from-port="2" to-layer="3307" to-port="0" /> <edge from-layer="3307" from-port="1" to-layer="3308" to-port="1" /> <edge from-layer="3308" from-port="2" to-layer="3309" to-port="1" /> <edge from-layer="3309" from-port="2" to-layer="3310" to-port="1" /> <edge from-layer="3310" from-port="2" to-layer="3329" to-port="0" /> <edge from-layer="3310" from-port="2" to-layer="3319" to-port="0" /> <edge from-layer="3311" from-port="0" to-layer="3312" to-port="0" /> <edge from-layer="3312" from-port="1" to-layer="3315" to-port="0" /> <edge from-layer="3313" from-port="0" to-layer="3314" to-port="0" /> <edge from-layer="3314" from-port="1" to-layer="3315" to-port="1" /> <edge from-layer="3315" from-port="2" to-layer="3317" to-port="0" /> <edge from-layer="3316" from-port="0" to-layer="3317" to-port="1" /> <edge from-layer="3317" from-port="2" to-layer="3318" to-port="0" /> <edge from-layer="3318" from-port="1" to-layer="3319" to-port="1" /> <edge from-layer="3319" from-port="2" to-layer="3320" to-port="0" /> <edge from-layer="3320" from-port="1" to-layer="3330" to-port="0" /> <edge from-layer="3321" from-port="0" to-layer="3322" to-port="0" /> <edge from-layer="3322" from-port="1" to-layer="3325" to-port="0" /> <edge from-layer="3323" from-port="0" to-layer="3324" to-port="0" /> <edge from-layer="3324" from-port="1" to-layer="3325" to-port="1" /> <edge from-layer="3325" from-port="2" to-layer="3327" to-port="0" /> <edge from-layer="3326" from-port="0" to-layer="3327" to-port="1" /> <edge from-layer="3327" from-port="2" to-layer="3328" to-port="0" /> <edge from-layer="3328" from-port="1" to-layer="3329" to-port="1" /> <edge from-layer="3329" from-port="2" to-layer="3330" to-port="1" /> <edge from-layer="3330" from-port="2" to-layer="3339" to-port="0" /> <edge from-layer="3331" from-port="0" to-layer="3332" to-port="0" /> <edge from-layer="3332" from-port="1" to-layer="3335" to-port="0" /> <edge from-layer="3333" from-port="0" to-layer="3334" to-port="0" /> <edge from-layer="3334" from-port="1" to-layer="3335" to-port="1" /> <edge from-layer="3335" from-port="2" to-layer="3337" to-port="0" /> <edge from-layer="3336" from-port="0" to-layer="3337" to-port="1" /> <edge from-layer="3337" from-port="2" to-layer="3338" to-port="0" /> <edge from-layer="3338" from-port="1" to-layer="3339" to-port="1" /> <edge from-layer="3339" from-port="2" to-layer="3340" to-port="1" /> <edge from-layer="3340" from-port="2" to-layer="3344" to-port="0" /> <edge from-layer="3340" from-port="2" to-layer="3449" to-port="0" /> <edge from-layer="3340" from-port="2" to-layer="3351" to-port="0" /> <edge from-layer="3341" from-port="0" to-layer="3352" to-port="0" /> <edge from-layer="3342" from-port="0" to-layer="3350" to-port="0" /> <edge from-layer="3343" from-port="0" to-layer="3344" to-port="1" /> <edge from-layer="3344" from-port="2" to-layer="3346" to-port="0" /> <edge from-layer="3345" from-port="0" to-layer="3346" to-port="1" /> <edge from-layer="3346" from-port="2" to-layer="3348" to-port="0" /> <edge from-layer="3347" from-port="0" to-layer="3348" to-port="1" /> <edge from-layer="3348" from-port="2" to-layer="3349" to-port="0" /> <edge from-layer="3349" from-port="1" to-layer="3350" to-port="1" /> <edge from-layer="3350" from-port="2" to-layer="3351" to-port="1" /> <edge from-layer="3351" from-port="2" to-layer="3352" to-port="1" /> <edge from-layer="3352" from-port="2" to-layer="3391" to-port="0" /> <edge from-layer="3352" from-port="2" to-layer="3426" to-port="0" /> <edge from-layer="3352" from-port="2" to-layer="3361" to-port="0" /> <edge from-layer="3353" from-port="0" to-layer="3354" to-port="0" /> <edge from-layer="3354" from-port="1" to-layer="3357" to-port="0" /> <edge from-layer="3355" from-port="0" to-layer="3356" to-port="0" /> <edge from-layer="3356" from-port="1" to-layer="3357" to-port="1" /> <edge from-layer="3357" from-port="2" to-layer="3359" to-port="0" /> <edge from-layer="3358" from-port="0" to-layer="3359" to-port="1" /> <edge from-layer="3359" from-port="2" to-layer="3360" to-port="0" /> <edge from-layer="3360" from-port="1" to-layer="3361" to-port="1" /> <edge from-layer="3361" from-port="2" to-layer="3363" to-port="0" /> <edge from-layer="3362" from-port="0" to-layer="3363" to-port="1" /> <edge from-layer="3363" from-port="2" to-layer="3365" to-port="0" /> <edge from-layer="3364" from-port="0" to-layer="3365" to-port="1" /> <edge from-layer="3365" from-port="2" to-layer="3370" to-port="0" /> <edge from-layer="3365" from-port="2" to-layer="3376" to-port="0" /> <edge from-layer="3365" from-port="2" to-layer="3366" to-port="0" /> <edge from-layer="3366" from-port="2" to-layer="3379" to-port="0" /> <edge from-layer="3367" from-port="0" to-layer="3370" to-port="1" /> <edge from-layer="3368" from-port="0" to-layer="3370" to-port="2" /> <edge from-layer="3369" from-port="0" to-layer="3370" to-port="3" /> <edge from-layer="3370" from-port="5" to-layer="3372" to-port="0" /> <edge from-layer="3371" from-port="0" to-layer="3372" to-port="1" /> <edge from-layer="3372" from-port="2" to-layer="3377" to-port="0" /> <edge from-layer="3373" from-port="0" to-layer="3376" to-port="1" /> <edge from-layer="3374" from-port="0" to-layer="3376" to-port="2" /> <edge from-layer="3375" from-port="0" to-layer="3376" to-port="3" /> <edge from-layer="3376" from-port="5" to-layer="3377" to-port="1" /> <edge from-layer="3377" from-port="2" to-layer="3378" to-port="0" /> <edge from-layer="3378" from-port="2" to-layer="3379" to-port="1" /> <edge from-layer="3379" from-port="2" to-layer="3436" to-port="0" /> <edge from-layer="3380" from-port="1" to-layer="3382" to-port="0" /> <edge from-layer="3381" from-port="0" to-layer="3382" to-port="2" /> <edge from-layer="3382" from-port="3" to-layer="3410" to-port="0" /> <edge from-layer="3383" from-port="0" to-layer="3384" to-port="0" /> <edge from-layer="3384" from-port="1" to-layer="3387" to-port="0" /> <edge from-layer="3385" from-port="0" to-layer="3386" to-port="0" /> <edge from-layer="3386" from-port="1" to-layer="3387" to-port="1" /> <edge from-layer="3387" from-port="2" to-layer="3389" to-port="0" /> <edge from-layer="3388" from-port="0" to-layer="3389" to-port="1" /> <edge from-layer="3389" from-port="2" to-layer="3390" to-port="0" /> <edge from-layer="3390" from-port="1" to-layer="3391" to-port="1" /> <edge from-layer="3391" from-port="2" to-layer="3393" to-port="0" /> <edge from-layer="3392" from-port="0" to-layer="3393" to-port="1" /> <edge from-layer="3393" from-port="2" to-layer="3395" to-port="0" /> <edge from-layer="3394" from-port="0" to-layer="3395" to-port="1" /> <edge from-layer="3395" from-port="2" to-layer="3406" to-port="0" /> <edge from-layer="3395" from-port="2" to-layer="3400" to-port="0" /> <edge from-layer="3395" from-port="2" to-layer="3396" to-port="0" /> <edge from-layer="3396" from-port="2" to-layer="3409" to-port="0" /> <edge from-layer="3397" from-port="0" to-layer="3400" to-port="1" /> <edge from-layer="3398" from-port="0" to-layer="3400" to-port="2" /> <edge from-layer="3399" from-port="0" to-layer="3400" to-port="3" /> <edge from-layer="3400" from-port="5" to-layer="3402" to-port="0" /> <edge from-layer="3401" from-port="0" to-layer="3402" to-port="1" /> <edge from-layer="3402" from-port="2" to-layer="3407" to-port="0" /> <edge from-layer="3403" from-port="0" to-layer="3406" to-port="1" /> <edge from-layer="3404" from-port="0" to-layer="3406" to-port="2" /> <edge from-layer="3405" from-port="0" to-layer="3406" to-port="3" /> <edge from-layer="3406" from-port="5" to-layer="3407" to-port="1" /> <edge from-layer="3407" from-port="2" to-layer="3408" to-port="0" /> <edge from-layer="3408" from-port="2" to-layer="3409" to-port="1" /> <edge from-layer="3409" from-port="2" to-layer="3410" to-port="1" /> <edge from-layer="3410" from-port="2" to-layer="6154" to-port="0" /> <edge from-layer="3410" from-port="2" to-layer="3411" to-port="0" /> <edge from-layer="3411" from-port="2" to-layer="3412" to-port="0" /> <edge from-layer="3412" from-port="2" to-layer="3414" to-port="0" /> <edge from-layer="3413" from-port="0" to-layer="3414" to-port="1" /> <edge from-layer="3414" from-port="2" to-layer="3436" to-port="1" /> <edge from-layer="3415" from-port="1" to-layer="3417" to-port="0" /> <edge from-layer="3416" from-port="0" to-layer="3417" to-port="2" /> <edge from-layer="3417" from-port="3" to-layer="3431" to-port="0" /> <edge from-layer="3418" from-port="0" to-layer="3419" to-port="0" /> <edge from-layer="3419" from-port="1" to-layer="3422" to-port="0" /> <edge from-layer="3420" from-port="0" to-layer="3421" to-port="0" /> <edge from-layer="3421" from-port="1" to-layer="3422" to-port="1" /> <edge from-layer="3422" from-port="2" to-layer="3424" to-port="0" /> <edge from-layer="3423" from-port="0" to-layer="3424" to-port="1" /> <edge from-layer="3424" from-port="2" to-layer="3425" to-port="0" /> <edge from-layer="3425" from-port="1" to-layer="3426" to-port="1" /> <edge from-layer="3426" from-port="2" to-layer="3428" to-port="0" /> <edge from-layer="3427" from-port="0" to-layer="3428" to-port="1" /> <edge from-layer="3428" from-port="2" to-layer="3430" to-port="0" /> <edge from-layer="3429" from-port="0" to-layer="3430" to-port="1" /> <edge from-layer="3430" from-port="2" to-layer="3431" to-port="1" /> <edge from-layer="3431" from-port="2" to-layer="6153" to-port="0" /> <edge from-layer="3431" from-port="2" to-layer="3432" to-port="0" /> <edge from-layer="3432" from-port="2" to-layer="3433" to-port="0" /> <edge from-layer="3433" from-port="2" to-layer="3435" to-port="0" /> <edge from-layer="3434" from-port="0" to-layer="3435" to-port="1" /> <edge from-layer="3435" from-port="2" to-layer="3436" to-port="2" /> <edge from-layer="3436" from-port="4" to-layer="3438" to-port="0" /> <edge from-layer="3437" from-port="0" to-layer="3438" to-port="1" /> <edge from-layer="3438" from-port="2" to-layer="3439" to-port="0" /> <edge from-layer="3439" from-port="2" to-layer="3448" to-port="0" /> <edge from-layer="3440" from-port="0" to-layer="3441" to-port="0" /> <edge from-layer="3441" from-port="1" to-layer="3444" to-port="0" /> <edge from-layer="3442" from-port="0" to-layer="3443" to-port="0" /> <edge from-layer="3443" from-port="1" to-layer="3444" to-port="1" /> <edge from-layer="3444" from-port="2" to-layer="3446" to-port="0" /> <edge from-layer="3445" from-port="0" to-layer="3446" to-port="1" /> <edge from-layer="3446" from-port="2" to-layer="3447" to-port="0" /> <edge from-layer="3447" from-port="1" to-layer="3448" to-port="1" /> <edge from-layer="3448" from-port="2" to-layer="3449" to-port="1" /> <edge from-layer="3449" from-port="2" to-layer="3460" to-port="0" /> <edge from-layer="3449" from-port="2" to-layer="3453" to-port="0" /> <edge from-layer="3449" from-port="2" to-layer="3491" to-port="0" /> <edge from-layer="3450" from-port="0" to-layer="3461" to-port="0" /> <edge from-layer="3451" from-port="0" to-layer="3459" to-port="0" /> <edge from-layer="3452" from-port="0" to-layer="3453" to-port="1" /> <edge from-layer="3453" from-port="2" to-layer="3455" to-port="0" /> <edge from-layer="3454" from-port="0" to-layer="3455" to-port="1" /> <edge from-layer="3455" from-port="2" to-layer="3457" to-port="0" /> <edge from-layer="3456" from-port="0" to-layer="3457" to-port="1" /> <edge from-layer="3457" from-port="2" to-layer="3458" to-port="0" /> <edge from-layer="3458" from-port="1" to-layer="3459" to-port="1" /> <edge from-layer="3459" from-port="2" to-layer="3460" to-port="1" /> <edge from-layer="3460" from-port="2" to-layer="3461" to-port="1" /> <edge from-layer="3461" from-port="2" to-layer="3480" to-port="0" /> <edge from-layer="3461" from-port="2" to-layer="3470" to-port="0" /> <edge from-layer="3462" from-port="0" to-layer="3463" to-port="0" /> <edge from-layer="3463" from-port="1" to-layer="3466" to-port="0" /> <edge from-layer="3464" from-port="0" to-layer="3465" to-port="0" /> <edge from-layer="3465" from-port="1" to-layer="3466" to-port="1" /> <edge from-layer="3466" from-port="2" to-layer="3468" to-port="0" /> <edge from-layer="3467" from-port="0" to-layer="3468" to-port="1" /> <edge from-layer="3468" from-port="2" to-layer="3469" to-port="0" /> <edge from-layer="3469" from-port="1" to-layer="3470" to-port="1" /> <edge from-layer="3470" from-port="2" to-layer="3471" to-port="0" /> <edge from-layer="3471" from-port="1" to-layer="3481" to-port="0" /> <edge from-layer="3472" from-port="0" to-layer="3473" to-port="0" /> <edge from-layer="3473" from-port="1" to-layer="3476" to-port="0" /> <edge from-layer="3474" from-port="0" to-layer="3475" to-port="0" /> <edge from-layer="3475" from-port="1" to-layer="3476" to-port="1" /> <edge from-layer="3476" from-port="2" to-layer="3478" to-port="0" /> <edge from-layer="3477" from-port="0" to-layer="3478" to-port="1" /> <edge from-layer="3478" from-port="2" to-layer="3479" to-port="0" /> <edge from-layer="3479" from-port="1" to-layer="3480" to-port="1" /> <edge from-layer="3480" from-port="2" to-layer="3481" to-port="1" /> <edge from-layer="3481" from-port="2" to-layer="3490" to-port="0" /> <edge from-layer="3482" from-port="0" to-layer="3483" to-port="0" /> <edge from-layer="3483" from-port="1" to-layer="3486" to-port="0" /> <edge from-layer="3484" from-port="0" to-layer="3485" to-port="0" /> <edge from-layer="3485" from-port="1" to-layer="3486" to-port="1" /> <edge from-layer="3486" from-port="2" to-layer="3488" to-port="0" /> <edge from-layer="3487" from-port="0" to-layer="3488" to-port="1" /> <edge from-layer="3488" from-port="2" to-layer="3489" to-port="0" /> <edge from-layer="3489" from-port="1" to-layer="3490" to-port="1" /> <edge from-layer="3490" from-port="2" to-layer="3491" to-port="1" /> <edge from-layer="3491" from-port="2" to-layer="3600" to-port="0" /> <edge from-layer="3491" from-port="2" to-layer="3502" to-port="0" /> <edge from-layer="3491" from-port="2" to-layer="3495" to-port="0" /> <edge from-layer="3492" from-port="0" to-layer="3503" to-port="0" /> <edge from-layer="3493" from-port="0" to-layer="3501" to-port="0" /> <edge from-layer="3494" from-port="0" to-layer="3495" to-port="1" /> <edge from-layer="3495" from-port="2" to-layer="3497" to-port="0" /> <edge from-layer="3496" from-port="0" to-layer="3497" to-port="1" /> <edge from-layer="3497" from-port="2" to-layer="3499" to-port="0" /> <edge from-layer="3498" from-port="0" to-layer="3499" to-port="1" /> <edge from-layer="3499" from-port="2" to-layer="3500" to-port="0" /> <edge from-layer="3500" from-port="1" to-layer="3501" to-port="1" /> <edge from-layer="3501" from-port="2" to-layer="3502" to-port="1" /> <edge from-layer="3502" from-port="2" to-layer="3503" to-port="1" /> <edge from-layer="3503" from-port="2" to-layer="3542" to-port="0" /> <edge from-layer="3503" from-port="2" to-layer="3577" to-port="0" /> <edge from-layer="3503" from-port="2" to-layer="3512" to-port="0" /> <edge from-layer="3504" from-port="0" to-layer="3505" to-port="0" /> <edge from-layer="3505" from-port="1" to-layer="3508" to-port="0" /> <edge from-layer="3506" from-port="0" to-layer="3507" to-port="0" /> <edge from-layer="3507" from-port="1" to-layer="3508" to-port="1" /> <edge from-layer="3508" from-port="2" to-layer="3510" to-port="0" /> <edge from-layer="3509" from-port="0" to-layer="3510" to-port="1" /> <edge from-layer="3510" from-port="2" to-layer="3511" to-port="0" /> <edge from-layer="3511" from-port="1" to-layer="3512" to-port="1" /> <edge from-layer="3512" from-port="2" to-layer="3514" to-port="0" /> <edge from-layer="3513" from-port="0" to-layer="3514" to-port="1" /> <edge from-layer="3514" from-port="2" to-layer="3516" to-port="0" /> <edge from-layer="3515" from-port="0" to-layer="3516" to-port="1" /> <edge from-layer="3516" from-port="2" to-layer="3517" to-port="0" /> <edge from-layer="3516" from-port="2" to-layer="3527" to-port="0" /> <edge from-layer="3516" from-port="2" to-layer="3521" to-port="0" /> <edge from-layer="3517" from-port="2" to-layer="3530" to-port="0" /> <edge from-layer="3518" from-port="0" to-layer="3521" to-port="1" /> <edge from-layer="3519" from-port="0" to-layer="3521" to-port="2" /> <edge from-layer="3520" from-port="0" to-layer="3521" to-port="3" /> <edge from-layer="3521" from-port="5" to-layer="3523" to-port="0" /> <edge from-layer="3522" from-port="0" to-layer="3523" to-port="1" /> <edge from-layer="3523" from-port="2" to-layer="3528" to-port="0" /> <edge from-layer="3524" from-port="0" to-layer="3527" to-port="1" /> <edge from-layer="3525" from-port="0" to-layer="3527" to-port="2" /> <edge from-layer="3526" from-port="0" to-layer="3527" to-port="3" /> <edge from-layer="3527" from-port="5" to-layer="3528" to-port="1" /> <edge from-layer="3528" from-port="2" to-layer="3529" to-port="0" /> <edge from-layer="3529" from-port="2" to-layer="3530" to-port="1" /> <edge from-layer="3530" from-port="2" to-layer="3587" to-port="0" /> <edge from-layer="3531" from-port="1" to-layer="3533" to-port="0" /> <edge from-layer="3532" from-port="0" to-layer="3533" to-port="2" /> <edge from-layer="3533" from-port="3" to-layer="3561" to-port="0" /> <edge from-layer="3534" from-port="0" to-layer="3535" to-port="0" /> <edge from-layer="3535" from-port="1" to-layer="3538" to-port="0" /> <edge from-layer="3536" from-port="0" to-layer="3537" to-port="0" /> <edge from-layer="3537" from-port="1" to-layer="3538" to-port="1" /> <edge from-layer="3538" from-port="2" to-layer="3540" to-port="0" /> <edge from-layer="3539" from-port="0" to-layer="3540" to-port="1" /> <edge from-layer="3540" from-port="2" to-layer="3541" to-port="0" /> <edge from-layer="3541" from-port="1" to-layer="3542" to-port="1" /> <edge from-layer="3542" from-port="2" to-layer="3544" to-port="0" /> <edge from-layer="3543" from-port="0" to-layer="3544" to-port="1" /> <edge from-layer="3544" from-port="2" to-layer="3546" to-port="0" /> <edge from-layer="3545" from-port="0" to-layer="3546" to-port="1" /> <edge from-layer="3546" from-port="2" to-layer="3547" to-port="0" /> <edge from-layer="3546" from-port="2" to-layer="3551" to-port="0" /> <edge from-layer="3546" from-port="2" to-layer="3557" to-port="0" /> <edge from-layer="3547" from-port="2" to-layer="3560" to-port="0" /> <edge from-layer="3548" from-port="0" to-layer="3551" to-port="1" /> <edge from-layer="3549" from-port="0" to-layer="3551" to-port="2" /> <edge from-layer="3550" from-port="0" to-layer="3551" to-port="3" /> <edge from-layer="3551" from-port="5" to-layer="3553" to-port="0" /> <edge from-layer="3552" from-port="0" to-layer="3553" to-port="1" /> <edge from-layer="3553" from-port="2" to-layer="3558" to-port="0" /> <edge from-layer="3554" from-port="0" to-layer="3557" to-port="1" /> <edge from-layer="3555" from-port="0" to-layer="3557" to-port="2" /> <edge from-layer="3556" from-port="0" to-layer="3557" to-port="3" /> <edge from-layer="3557" from-port="5" to-layer="3558" to-port="1" /> <edge from-layer="3558" from-port="2" to-layer="3559" to-port="0" /> <edge from-layer="3559" from-port="2" to-layer="3560" to-port="1" /> <edge from-layer="3560" from-port="2" to-layer="3561" to-port="1" /> <edge from-layer="3561" from-port="2" to-layer="6152" to-port="0" /> <edge from-layer="3561" from-port="2" to-layer="3562" to-port="0" /> <edge from-layer="3562" from-port="2" to-layer="3563" to-port="0" /> <edge from-layer="3563" from-port="2" to-layer="3565" to-port="0" /> <edge from-layer="3564" from-port="0" to-layer="3565" to-port="1" /> <edge from-layer="3565" from-port="2" to-layer="3587" to-port="1" /> <edge from-layer="3566" from-port="1" to-layer="3568" to-port="0" /> <edge from-layer="3567" from-port="0" to-layer="3568" to-port="2" /> <edge from-layer="3568" from-port="3" to-layer="3582" to-port="0" /> <edge from-layer="3569" from-port="0" to-layer="3570" to-port="0" /> <edge from-layer="3570" from-port="1" to-layer="3573" to-port="0" /> <edge from-layer="3571" from-port="0" to-layer="3572" to-port="0" /> <edge from-layer="3572" from-port="1" to-layer="3573" to-port="1" /> <edge from-layer="3573" from-port="2" to-layer="3575" to-port="0" /> <edge from-layer="3574" from-port="0" to-layer="3575" to-port="1" /> <edge from-layer="3575" from-port="2" to-layer="3576" to-port="0" /> <edge from-layer="3576" from-port="1" to-layer="3577" to-port="1" /> <edge from-layer="3577" from-port="2" to-layer="3579" to-port="0" /> <edge from-layer="3578" from-port="0" to-layer="3579" to-port="1" /> <edge from-layer="3579" from-port="2" to-layer="3581" to-port="0" /> <edge from-layer="3580" from-port="0" to-layer="3581" to-port="1" /> <edge from-layer="3581" from-port="2" to-layer="3582" to-port="1" /> <edge from-layer="3582" from-port="2" to-layer="6151" to-port="0" /> <edge from-layer="3582" from-port="2" to-layer="3583" to-port="0" /> <edge from-layer="3583" from-port="2" to-layer="3584" to-port="0" /> <edge from-layer="3584" from-port="2" to-layer="3586" to-port="0" /> <edge from-layer="3585" from-port="0" to-layer="3586" to-port="1" /> <edge from-layer="3586" from-port="2" to-layer="3587" to-port="2" /> <edge from-layer="3587" from-port="4" to-layer="3589" to-port="0" /> <edge from-layer="3588" from-port="0" to-layer="3589" to-port="1" /> <edge from-layer="3589" from-port="2" to-layer="3590" to-port="0" /> <edge from-layer="3590" from-port="2" to-layer="3599" to-port="0" /> <edge from-layer="3591" from-port="0" to-layer="3592" to-port="0" /> <edge from-layer="3592" from-port="1" to-layer="3595" to-port="0" /> <edge from-layer="3593" from-port="0" to-layer="3594" to-port="0" /> <edge from-layer="3594" from-port="1" to-layer="3595" to-port="1" /> <edge from-layer="3595" from-port="2" to-layer="3597" to-port="0" /> <edge from-layer="3596" from-port="0" to-layer="3597" to-port="1" /> <edge from-layer="3597" from-port="2" to-layer="3598" to-port="0" /> <edge from-layer="3598" from-port="1" to-layer="3599" to-port="1" /> <edge from-layer="3599" from-port="2" to-layer="3600" to-port="1" /> <edge from-layer="3600" from-port="2" to-layer="3604" to-port="0" /> <edge from-layer="3600" from-port="2" to-layer="3642" to-port="0" /> <edge from-layer="3600" from-port="2" to-layer="3611" to-port="0" /> <edge from-layer="3601" from-port="0" to-layer="3612" to-port="0" /> <edge from-layer="3602" from-port="0" to-layer="3610" to-port="0" /> <edge from-layer="3603" from-port="0" to-layer="3604" to-port="1" /> <edge from-layer="3604" from-port="2" to-layer="3606" to-port="0" /> <edge from-layer="3605" from-port="0" to-layer="3606" to-port="1" /> <edge from-layer="3606" from-port="2" to-layer="3608" to-port="0" /> <edge from-layer="3607" from-port="0" to-layer="3608" to-port="1" /> <edge from-layer="3608" from-port="2" to-layer="3609" to-port="0" /> <edge from-layer="3609" from-port="1" to-layer="3610" to-port="1" /> <edge from-layer="3610" from-port="2" to-layer="3611" to-port="1" /> <edge from-layer="3611" from-port="2" to-layer="3612" to-port="1" /> <edge from-layer="3612" from-port="2" to-layer="3631" to-port="0" /> <edge from-layer="3612" from-port="2" to-layer="3621" to-port="0" /> <edge from-layer="3613" from-port="0" to-layer="3614" to-port="0" /> <edge from-layer="3614" from-port="1" to-layer="3617" to-port="0" /> <edge from-layer="3615" from-port="0" to-layer="3616" to-port="0" /> <edge from-layer="3616" from-port="1" to-layer="3617" to-port="1" /> <edge from-layer="3617" from-port="2" to-layer="3619" to-port="0" /> <edge from-layer="3618" from-port="0" to-layer="3619" to-port="1" /> <edge from-layer="3619" from-port="2" to-layer="3620" to-port="0" /> <edge from-layer="3620" from-port="1" to-layer="3621" to-port="1" /> <edge from-layer="3621" from-port="2" to-layer="3622" to-port="0" /> <edge from-layer="3622" from-port="1" to-layer="3632" to-port="0" /> <edge from-layer="3623" from-port="0" to-layer="3624" to-port="0" /> <edge from-layer="3624" from-port="1" to-layer="3627" to-port="0" /> <edge from-layer="3625" from-port="0" to-layer="3626" to-port="0" /> <edge from-layer="3626" from-port="1" to-layer="3627" to-port="1" /> <edge from-layer="3627" from-port="2" to-layer="3629" to-port="0" /> <edge from-layer="3628" from-port="0" to-layer="3629" to-port="1" /> <edge from-layer="3629" from-port="2" to-layer="3630" to-port="0" /> <edge from-layer="3630" from-port="1" to-layer="3631" to-port="1" /> <edge from-layer="3631" from-port="2" to-layer="3632" to-port="1" /> <edge from-layer="3632" from-port="2" to-layer="3641" to-port="0" /> <edge from-layer="3633" from-port="0" to-layer="3634" to-port="0" /> <edge from-layer="3634" from-port="1" to-layer="3637" to-port="0" /> <edge from-layer="3635" from-port="0" to-layer="3636" to-port="0" /> <edge from-layer="3636" from-port="1" to-layer="3637" to-port="1" /> <edge from-layer="3637" from-port="2" to-layer="3639" to-port="0" /> <edge from-layer="3638" from-port="0" to-layer="3639" to-port="1" /> <edge from-layer="3639" from-port="2" to-layer="3640" to-port="0" /> <edge from-layer="3640" from-port="1" to-layer="3641" to-port="1" /> <edge from-layer="3641" from-port="2" to-layer="3642" to-port="1" /> <edge from-layer="3642" from-port="2" to-layer="3751" to-port="0" /> <edge from-layer="3642" from-port="2" to-layer="3646" to-port="0" /> <edge from-layer="3642" from-port="2" to-layer="3653" to-port="0" /> <edge from-layer="3643" from-port="0" to-layer="3654" to-port="0" /> <edge from-layer="3644" from-port="0" to-layer="3652" to-port="0" /> <edge from-layer="3645" from-port="0" to-layer="3646" to-port="1" /> <edge from-layer="3646" from-port="2" to-layer="3648" to-port="0" /> <edge from-layer="3647" from-port="0" to-layer="3648" to-port="1" /> <edge from-layer="3648" from-port="2" to-layer="3650" to-port="0" /> <edge from-layer="3649" from-port="0" to-layer="3650" to-port="1" /> <edge from-layer="3650" from-port="2" to-layer="3651" to-port="0" /> <edge from-layer="3651" from-port="1" to-layer="3652" to-port="1" /> <edge from-layer="3652" from-port="2" to-layer="3653" to-port="1" /> <edge from-layer="3653" from-port="2" to-layer="3654" to-port="1" /> <edge from-layer="3654" from-port="2" to-layer="3663" to-port="0" /> <edge from-layer="3654" from-port="2" to-layer="3728" to-port="0" /> <edge from-layer="3654" from-port="2" to-layer="3693" to-port="0" /> <edge from-layer="3655" from-port="0" to-layer="3656" to-port="0" /> <edge from-layer="3656" from-port="1" to-layer="3659" to-port="0" /> <edge from-layer="3657" from-port="0" to-layer="3658" to-port="0" /> <edge from-layer="3658" from-port="1" to-layer="3659" to-port="1" /> <edge from-layer="3659" from-port="2" to-layer="3661" to-port="0" /> <edge from-layer="3660" from-port="0" to-layer="3661" to-port="1" /> <edge from-layer="3661" from-port="2" to-layer="3662" to-port="0" /> <edge from-layer="3662" from-port="1" to-layer="3663" to-port="1" /> <edge from-layer="3663" from-port="2" to-layer="3665" to-port="0" /> <edge from-layer="3664" from-port="0" to-layer="3665" to-port="1" /> <edge from-layer="3665" from-port="2" to-layer="3667" to-port="0" /> <edge from-layer="3666" from-port="0" to-layer="3667" to-port="1" /> <edge from-layer="3667" from-port="2" to-layer="3672" to-port="0" /> <edge from-layer="3667" from-port="2" to-layer="3668" to-port="0" /> <edge from-layer="3667" from-port="2" to-layer="3678" to-port="0" /> <edge from-layer="3668" from-port="2" to-layer="3681" to-port="0" /> <edge from-layer="3669" from-port="0" to-layer="3672" to-port="1" /> <edge from-layer="3670" from-port="0" to-layer="3672" to-port="2" /> <edge from-layer="3671" from-port="0" to-layer="3672" to-port="3" /> <edge from-layer="3672" from-port="5" to-layer="3674" to-port="0" /> <edge from-layer="3673" from-port="0" to-layer="3674" to-port="1" /> <edge from-layer="3674" from-port="2" to-layer="3679" to-port="0" /> <edge from-layer="3675" from-port="0" to-layer="3678" to-port="1" /> <edge from-layer="3676" from-port="0" to-layer="3678" to-port="2" /> <edge from-layer="3677" from-port="0" to-layer="3678" to-port="3" /> <edge from-layer="3678" from-port="5" to-layer="3679" to-port="1" /> <edge from-layer="3679" from-port="2" to-layer="3680" to-port="0" /> <edge from-layer="3680" from-port="2" to-layer="3681" to-port="1" /> <edge from-layer="3681" from-port="2" to-layer="3738" to-port="0" /> <edge from-layer="3682" from-port="1" to-layer="3684" to-port="0" /> <edge from-layer="3683" from-port="0" to-layer="3684" to-port="2" /> <edge from-layer="3684" from-port="3" to-layer="3712" to-port="0" /> <edge from-layer="3685" from-port="0" to-layer="3686" to-port="0" /> <edge from-layer="3686" from-port="1" to-layer="3689" to-port="0" /> <edge from-layer="3687" from-port="0" to-layer="3688" to-port="0" /> <edge from-layer="3688" from-port="1" to-layer="3689" to-port="1" /> <edge from-layer="3689" from-port="2" to-layer="3691" to-port="0" /> <edge from-layer="3690" from-port="0" to-layer="3691" to-port="1" /> <edge from-layer="3691" from-port="2" to-layer="3692" to-port="0" /> <edge from-layer="3692" from-port="1" to-layer="3693" to-port="1" /> <edge from-layer="3693" from-port="2" to-layer="3695" to-port="0" /> <edge from-layer="3694" from-port="0" to-layer="3695" to-port="1" /> <edge from-layer="3695" from-port="2" to-layer="3697" to-port="0" /> <edge from-layer="3696" from-port="0" to-layer="3697" to-port="1" /> <edge from-layer="3697" from-port="2" to-layer="3708" to-port="0" /> <edge from-layer="3697" from-port="2" to-layer="3698" to-port="0" /> <edge from-layer="3697" from-port="2" to-layer="3702" to-port="0" /> <edge from-layer="3698" from-port="2" to-layer="3711" to-port="0" /> <edge from-layer="3699" from-port="0" to-layer="3702" to-port="1" /> <edge from-layer="3700" from-port="0" to-layer="3702" to-port="2" /> <edge from-layer="3701" from-port="0" to-layer="3702" to-port="3" /> <edge from-layer="3702" from-port="5" to-layer="3704" to-port="0" /> <edge from-layer="3703" from-port="0" to-layer="3704" to-port="1" /> <edge from-layer="3704" from-port="2" to-layer="3709" to-port="0" /> <edge from-layer="3705" from-port="0" to-layer="3708" to-port="1" /> <edge from-layer="3706" from-port="0" to-layer="3708" to-port="2" /> <edge from-layer="3707" from-port="0" to-layer="3708" to-port="3" /> <edge from-layer="3708" from-port="5" to-layer="3709" to-port="1" /> <edge from-layer="3709" from-port="2" to-layer="3710" to-port="0" /> <edge from-layer="3710" from-port="2" to-layer="3711" to-port="1" /> <edge from-layer="3711" from-port="2" to-layer="3712" to-port="1" /> <edge from-layer="3712" from-port="2" to-layer="3713" to-port="0" /> <edge from-layer="3712" from-port="2" to-layer="6150" to-port="0" /> <edge from-layer="3713" from-port="2" to-layer="3714" to-port="0" /> <edge from-layer="3714" from-port="2" to-layer="3716" to-port="0" /> <edge from-layer="3715" from-port="0" to-layer="3716" to-port="1" /> <edge from-layer="3716" from-port="2" to-layer="3738" to-port="1" /> <edge from-layer="3717" from-port="1" to-layer="3719" to-port="0" /> <edge from-layer="3718" from-port="0" to-layer="3719" to-port="2" /> <edge from-layer="3719" from-port="3" to-layer="3733" to-port="0" /> <edge from-layer="3720" from-port="0" to-layer="3721" to-port="0" /> <edge from-layer="3721" from-port="1" to-layer="3724" to-port="0" /> <edge from-layer="3722" from-port="0" to-layer="3723" to-port="0" /> <edge from-layer="3723" from-port="1" to-layer="3724" to-port="1" /> <edge from-layer="3724" from-port="2" to-layer="3726" to-port="0" /> <edge from-layer="3725" from-port="0" to-layer="3726" to-port="1" /> <edge from-layer="3726" from-port="2" to-layer="3727" to-port="0" /> <edge from-layer="3727" from-port="1" to-layer="3728" to-port="1" /> <edge from-layer="3728" from-port="2" to-layer="3730" to-port="0" /> <edge from-layer="3729" from-port="0" to-layer="3730" to-port="1" /> <edge from-layer="3730" from-port="2" to-layer="3732" to-port="0" /> <edge from-layer="3731" from-port="0" to-layer="3732" to-port="1" /> <edge from-layer="3732" from-port="2" to-layer="3733" to-port="1" /> <edge from-layer="3733" from-port="2" to-layer="3734" to-port="0" /> <edge from-layer="3733" from-port="2" to-layer="6149" to-port="0" /> <edge from-layer="3734" from-port="2" to-layer="3735" to-port="0" /> <edge from-layer="3735" from-port="2" to-layer="3737" to-port="0" /> <edge from-layer="3736" from-port="0" to-layer="3737" to-port="1" /> <edge from-layer="3737" from-port="2" to-layer="3738" to-port="2" /> <edge from-layer="3738" from-port="4" to-layer="3740" to-port="0" /> <edge from-layer="3739" from-port="0" to-layer="3740" to-port="1" /> <edge from-layer="3740" from-port="2" to-layer="3741" to-port="0" /> <edge from-layer="3741" from-port="2" to-layer="3750" to-port="0" /> <edge from-layer="3742" from-port="0" to-layer="3743" to-port="0" /> <edge from-layer="3743" from-port="1" to-layer="3746" to-port="0" /> <edge from-layer="3744" from-port="0" to-layer="3745" to-port="0" /> <edge from-layer="3745" from-port="1" to-layer="3746" to-port="1" /> <edge from-layer="3746" from-port="2" to-layer="3748" to-port="0" /> <edge from-layer="3747" from-port="0" to-layer="3748" to-port="1" /> <edge from-layer="3748" from-port="2" to-layer="3749" to-port="0" /> <edge from-layer="3749" from-port="1" to-layer="3750" to-port="1" /> <edge from-layer="3750" from-port="2" to-layer="3751" to-port="1" /> <edge from-layer="3751" from-port="2" to-layer="3762" to-port="0" /> <edge from-layer="3751" from-port="2" to-layer="3793" to-port="0" /> <edge from-layer="3751" from-port="2" to-layer="3755" to-port="0" /> <edge from-layer="3752" from-port="0" to-layer="3763" to-port="0" /> <edge from-layer="3753" from-port="0" to-layer="3761" to-port="0" /> <edge from-layer="3754" from-port="0" to-layer="3755" to-port="1" /> <edge from-layer="3755" from-port="2" to-layer="3757" to-port="0" /> <edge from-layer="3756" from-port="0" to-layer="3757" to-port="1" /> <edge from-layer="3757" from-port="2" to-layer="3759" to-port="0" /> <edge from-layer="3758" from-port="0" to-layer="3759" to-port="1" /> <edge from-layer="3759" from-port="2" to-layer="3760" to-port="0" /> <edge from-layer="3760" from-port="1" to-layer="3761" to-port="1" /> <edge from-layer="3761" from-port="2" to-layer="3762" to-port="1" /> <edge from-layer="3762" from-port="2" to-layer="3763" to-port="1" /> <edge from-layer="3763" from-port="2" to-layer="3772" to-port="0" /> <edge from-layer="3763" from-port="2" to-layer="3782" to-port="0" /> <edge from-layer="3764" from-port="0" to-layer="3765" to-port="0" /> <edge from-layer="3765" from-port="1" to-layer="3768" to-port="0" /> <edge from-layer="3766" from-port="0" to-layer="3767" to-port="0" /> <edge from-layer="3767" from-port="1" to-layer="3768" to-port="1" /> <edge from-layer="3768" from-port="2" to-layer="3770" to-port="0" /> <edge from-layer="3769" from-port="0" to-layer="3770" to-port="1" /> <edge from-layer="3770" from-port="2" to-layer="3771" to-port="0" /> <edge from-layer="3771" from-port="1" to-layer="3772" to-port="1" /> <edge from-layer="3772" from-port="2" to-layer="3773" to-port="0" /> <edge from-layer="3773" from-port="1" to-layer="3783" to-port="0" /> <edge from-layer="3774" from-port="0" to-layer="3775" to-port="0" /> <edge from-layer="3775" from-port="1" to-layer="3778" to-port="0" /> <edge from-layer="3776" from-port="0" to-layer="3777" to-port="0" /> <edge from-layer="3777" from-port="1" to-layer="3778" to-port="1" /> <edge from-layer="3778" from-port="2" to-layer="3780" to-port="0" /> <edge from-layer="3779" from-port="0" to-layer="3780" to-port="1" /> <edge from-layer="3780" from-port="2" to-layer="3781" to-port="0" /> <edge from-layer="3781" from-port="1" to-layer="3782" to-port="1" /> <edge from-layer="3782" from-port="2" to-layer="3783" to-port="1" /> <edge from-layer="3783" from-port="2" to-layer="3792" to-port="0" /> <edge from-layer="3784" from-port="0" to-layer="3785" to-port="0" /> <edge from-layer="3785" from-port="1" to-layer="3788" to-port="0" /> <edge from-layer="3786" from-port="0" to-layer="3787" to-port="0" /> <edge from-layer="3787" from-port="1" to-layer="3788" to-port="1" /> <edge from-layer="3788" from-port="2" to-layer="3790" to-port="0" /> <edge from-layer="3789" from-port="0" to-layer="3790" to-port="1" /> <edge from-layer="3790" from-port="2" to-layer="3791" to-port="0" /> <edge from-layer="3791" from-port="1" to-layer="3792" to-port="1" /> <edge from-layer="3792" from-port="2" to-layer="3793" to-port="1" /> <edge from-layer="3793" from-port="2" to-layer="3902" to-port="0" /> <edge from-layer="3793" from-port="2" to-layer="3804" to-port="0" /> <edge from-layer="3793" from-port="2" to-layer="3797" to-port="0" /> <edge from-layer="3794" from-port="0" to-layer="3805" to-port="0" /> <edge from-layer="3795" from-port="0" to-layer="3803" to-port="0" /> <edge from-layer="3796" from-port="0" to-layer="3797" to-port="1" /> <edge from-layer="3797" from-port="2" to-layer="3799" to-port="0" /> <edge from-layer="3798" from-port="0" to-layer="3799" to-port="1" /> <edge from-layer="3799" from-port="2" to-layer="3801" to-port="0" /> <edge from-layer="3800" from-port="0" to-layer="3801" to-port="1" /> <edge from-layer="3801" from-port="2" to-layer="3802" to-port="0" /> <edge from-layer="3802" from-port="1" to-layer="3803" to-port="1" /> <edge from-layer="3803" from-port="2" to-layer="3804" to-port="1" /> <edge from-layer="3804" from-port="2" to-layer="3805" to-port="1" /> <edge from-layer="3805" from-port="2" to-layer="3879" to-port="0" /> <edge from-layer="3805" from-port="2" to-layer="3844" to-port="0" /> <edge from-layer="3805" from-port="2" to-layer="3814" to-port="0" /> <edge from-layer="3806" from-port="0" to-layer="3807" to-port="0" /> <edge from-layer="3807" from-port="1" to-layer="3810" to-port="0" /> <edge from-layer="3808" from-port="0" to-layer="3809" to-port="0" /> <edge from-layer="3809" from-port="1" to-layer="3810" to-port="1" /> <edge from-layer="3810" from-port="2" to-layer="3812" to-port="0" /> <edge from-layer="3811" from-port="0" to-layer="3812" to-port="1" /> <edge from-layer="3812" from-port="2" to-layer="3813" to-port="0" /> <edge from-layer="3813" from-port="1" to-layer="3814" to-port="1" /> <edge from-layer="3814" from-port="2" to-layer="3816" to-port="0" /> <edge from-layer="3815" from-port="0" to-layer="3816" to-port="1" /> <edge from-layer="3816" from-port="2" to-layer="3818" to-port="0" /> <edge from-layer="3817" from-port="0" to-layer="3818" to-port="1" /> <edge from-layer="3818" from-port="2" to-layer="3819" to-port="0" /> <edge from-layer="3818" from-port="2" to-layer="3829" to-port="0" /> <edge from-layer="3818" from-port="2" to-layer="3823" to-port="0" /> <edge from-layer="3819" from-port="2" to-layer="3832" to-port="0" /> <edge from-layer="3820" from-port="0" to-layer="3823" to-port="1" /> <edge from-layer="3821" from-port="0" to-layer="3823" to-port="2" /> <edge from-layer="3822" from-port="0" to-layer="3823" to-port="3" /> <edge from-layer="3823" from-port="5" to-layer="3825" to-port="0" /> <edge from-layer="3824" from-port="0" to-layer="3825" to-port="1" /> <edge from-layer="3825" from-port="2" to-layer="3830" to-port="0" /> <edge from-layer="3826" from-port="0" to-layer="3829" to-port="1" /> <edge from-layer="3827" from-port="0" to-layer="3829" to-port="2" /> <edge from-layer="3828" from-port="0" to-layer="3829" to-port="3" /> <edge from-layer="3829" from-port="5" to-layer="3830" to-port="1" /> <edge from-layer="3830" from-port="2" to-layer="3831" to-port="0" /> <edge from-layer="3831" from-port="2" to-layer="3832" to-port="1" /> <edge from-layer="3832" from-port="2" to-layer="3889" to-port="0" /> <edge from-layer="3833" from-port="1" to-layer="3835" to-port="0" /> <edge from-layer="3834" from-port="0" to-layer="3835" to-port="2" /> <edge from-layer="3835" from-port="3" to-layer="3863" to-port="0" /> <edge from-layer="3836" from-port="0" to-layer="3837" to-port="0" /> <edge from-layer="3837" from-port="1" to-layer="3840" to-port="0" /> <edge from-layer="3838" from-port="0" to-layer="3839" to-port="0" /> <edge from-layer="3839" from-port="1" to-layer="3840" to-port="1" /> <edge from-layer="3840" from-port="2" to-layer="3842" to-port="0" /> <edge from-layer="3841" from-port="0" to-layer="3842" to-port="1" /> <edge from-layer="3842" from-port="2" to-layer="3843" to-port="0" /> <edge from-layer="3843" from-port="1" to-layer="3844" to-port="1" /> <edge from-layer="3844" from-port="2" to-layer="3846" to-port="0" /> <edge from-layer="3845" from-port="0" to-layer="3846" to-port="1" /> <edge from-layer="3846" from-port="2" to-layer="3848" to-port="0" /> <edge from-layer="3847" from-port="0" to-layer="3848" to-port="1" /> <edge from-layer="3848" from-port="2" to-layer="3849" to-port="0" /> <edge from-layer="3848" from-port="2" to-layer="3853" to-port="0" /> <edge from-layer="3848" from-port="2" to-layer="3859" to-port="0" /> <edge from-layer="3849" from-port="2" to-layer="3862" to-port="0" /> <edge from-layer="3850" from-port="0" to-layer="3853" to-port="1" /> <edge from-layer="3851" from-port="0" to-layer="3853" to-port="2" /> <edge from-layer="3852" from-port="0" to-layer="3853" to-port="3" /> <edge from-layer="3853" from-port="5" to-layer="3855" to-port="0" /> <edge from-layer="3854" from-port="0" to-layer="3855" to-port="1" /> <edge from-layer="3855" from-port="2" to-layer="3860" to-port="0" /> <edge from-layer="3856" from-port="0" to-layer="3859" to-port="1" /> <edge from-layer="3857" from-port="0" to-layer="3859" to-port="2" /> <edge from-layer="3858" from-port="0" to-layer="3859" to-port="3" /> <edge from-layer="3859" from-port="5" to-layer="3860" to-port="1" /> <edge from-layer="3860" from-port="2" to-layer="3861" to-port="0" /> <edge from-layer="3861" from-port="2" to-layer="3862" to-port="1" /> <edge from-layer="3862" from-port="2" to-layer="3863" to-port="1" /> <edge from-layer="3863" from-port="2" to-layer="6148" to-port="0" /> <edge from-layer="3863" from-port="2" to-layer="3864" to-port="0" /> <edge from-layer="3864" from-port="2" to-layer="3865" to-port="0" /> <edge from-layer="3865" from-port="2" to-layer="3867" to-port="0" /> <edge from-layer="3866" from-port="0" to-layer="3867" to-port="1" /> <edge from-layer="3867" from-port="2" to-layer="3889" to-port="1" /> <edge from-layer="3868" from-port="1" to-layer="3870" to-port="0" /> <edge from-layer="3869" from-port="0" to-layer="3870" to-port="2" /> <edge from-layer="3870" from-port="3" to-layer="3884" to-port="0" /> <edge from-layer="3871" from-port="0" to-layer="3872" to-port="0" /> <edge from-layer="3872" from-port="1" to-layer="3875" to-port="0" /> <edge from-layer="3873" from-port="0" to-layer="3874" to-port="0" /> <edge from-layer="3874" from-port="1" to-layer="3875" to-port="1" /> <edge from-layer="3875" from-port="2" to-layer="3877" to-port="0" /> <edge from-layer="3876" from-port="0" to-layer="3877" to-port="1" /> <edge from-layer="3877" from-port="2" to-layer="3878" to-port="0" /> <edge from-layer="3878" from-port="1" to-layer="3879" to-port="1" /> <edge from-layer="3879" from-port="2" to-layer="3881" to-port="0" /> <edge from-layer="3880" from-port="0" to-layer="3881" to-port="1" /> <edge from-layer="3881" from-port="2" to-layer="3883" to-port="0" /> <edge from-layer="3882" from-port="0" to-layer="3883" to-port="1" /> <edge from-layer="3883" from-port="2" to-layer="3884" to-port="1" /> <edge from-layer="3884" from-port="2" to-layer="6147" to-port="0" /> <edge from-layer="3884" from-port="2" to-layer="3885" to-port="0" /> <edge from-layer="3885" from-port="2" to-layer="3886" to-port="0" /> <edge from-layer="3886" from-port="2" to-layer="3888" to-port="0" /> <edge from-layer="3887" from-port="0" to-layer="3888" to-port="1" /> <edge from-layer="3888" from-port="2" to-layer="3889" to-port="2" /> <edge from-layer="3889" from-port="4" to-layer="3891" to-port="0" /> <edge from-layer="3890" from-port="0" to-layer="3891" to-port="1" /> <edge from-layer="3891" from-port="2" to-layer="3892" to-port="0" /> <edge from-layer="3892" from-port="2" to-layer="3901" to-port="0" /> <edge from-layer="3893" from-port="0" to-layer="3894" to-port="0" /> <edge from-layer="3894" from-port="1" to-layer="3897" to-port="0" /> <edge from-layer="3895" from-port="0" to-layer="3896" to-port="0" /> <edge from-layer="3896" from-port="1" to-layer="3897" to-port="1" /> <edge from-layer="3897" from-port="2" to-layer="3899" to-port="0" /> <edge from-layer="3898" from-port="0" to-layer="3899" to-port="1" /> <edge from-layer="3899" from-port="2" to-layer="3900" to-port="0" /> <edge from-layer="3900" from-port="1" to-layer="3901" to-port="1" /> <edge from-layer="3901" from-port="2" to-layer="3902" to-port="1" /> <edge from-layer="3902" from-port="2" to-layer="3944" to-port="0" /> <edge from-layer="3902" from-port="2" to-layer="3913" to-port="0" /> <edge from-layer="3902" from-port="2" to-layer="3906" to-port="0" /> <edge from-layer="3903" from-port="0" to-layer="3914" to-port="0" /> <edge from-layer="3904" from-port="0" to-layer="3912" to-port="0" /> <edge from-layer="3905" from-port="0" to-layer="3906" to-port="1" /> <edge from-layer="3906" from-port="2" to-layer="3908" to-port="0" /> <edge from-layer="3907" from-port="0" to-layer="3908" to-port="1" /> <edge from-layer="3908" from-port="2" to-layer="3910" to-port="0" /> <edge from-layer="3909" from-port="0" to-layer="3910" to-port="1" /> <edge from-layer="3910" from-port="2" to-layer="3911" to-port="0" /> <edge from-layer="3911" from-port="1" to-layer="3912" to-port="1" /> <edge from-layer="3912" from-port="2" to-layer="3913" to-port="1" /> <edge from-layer="3913" from-port="2" to-layer="3914" to-port="1" /> <edge from-layer="3914" from-port="2" to-layer="3923" to-port="0" /> <edge from-layer="3914" from-port="2" to-layer="3933" to-port="0" /> <edge from-layer="3915" from-port="0" to-layer="3916" to-port="0" /> <edge from-layer="3916" from-port="1" to-layer="3919" to-port="0" /> <edge from-layer="3917" from-port="0" to-layer="3918" to-port="0" /> <edge from-layer="3918" from-port="1" to-layer="3919" to-port="1" /> <edge from-layer="3919" from-port="2" to-layer="3921" to-port="0" /> <edge from-layer="3920" from-port="0" to-layer="3921" to-port="1" /> <edge from-layer="3921" from-port="2" to-layer="3922" to-port="0" /> <edge from-layer="3922" from-port="1" to-layer="3923" to-port="1" /> <edge from-layer="3923" from-port="2" to-layer="3924" to-port="0" /> <edge from-layer="3924" from-port="1" to-layer="3934" to-port="0" /> <edge from-layer="3925" from-port="0" to-layer="3926" to-port="0" /> <edge from-layer="3926" from-port="1" to-layer="3929" to-port="0" /> <edge from-layer="3927" from-port="0" to-layer="3928" to-port="0" /> <edge from-layer="3928" from-port="1" to-layer="3929" to-port="1" /> <edge from-layer="3929" from-port="2" to-layer="3931" to-port="0" /> <edge from-layer="3930" from-port="0" to-layer="3931" to-port="1" /> <edge from-layer="3931" from-port="2" to-layer="3932" to-port="0" /> <edge from-layer="3932" from-port="1" to-layer="3933" to-port="1" /> <edge from-layer="3933" from-port="2" to-layer="3934" to-port="1" /> <edge from-layer="3934" from-port="2" to-layer="3943" to-port="0" /> <edge from-layer="3935" from-port="0" to-layer="3936" to-port="0" /> <edge from-layer="3936" from-port="1" to-layer="3939" to-port="0" /> <edge from-layer="3937" from-port="0" to-layer="3938" to-port="0" /> <edge from-layer="3938" from-port="1" to-layer="3939" to-port="1" /> <edge from-layer="3939" from-port="2" to-layer="3941" to-port="0" /> <edge from-layer="3940" from-port="0" to-layer="3941" to-port="1" /> <edge from-layer="3941" from-port="2" to-layer="3942" to-port="0" /> <edge from-layer="3942" from-port="1" to-layer="3943" to-port="1" /> <edge from-layer="3943" from-port="2" to-layer="3944" to-port="1" /> <edge from-layer="3944" from-port="2" to-layer="4053" to-port="0" /> <edge from-layer="3944" from-port="2" to-layer="3948" to-port="0" /> <edge from-layer="3944" from-port="2" to-layer="3955" to-port="0" /> <edge from-layer="3945" from-port="0" to-layer="3956" to-port="0" /> <edge from-layer="3946" from-port="0" to-layer="3954" to-port="0" /> <edge from-layer="3947" from-port="0" to-layer="3948" to-port="1" /> <edge from-layer="3948" from-port="2" to-layer="3950" to-port="0" /> <edge from-layer="3949" from-port="0" to-layer="3950" to-port="1" /> <edge from-layer="3950" from-port="2" to-layer="3952" to-port="0" /> <edge from-layer="3951" from-port="0" to-layer="3952" to-port="1" /> <edge from-layer="3952" from-port="2" to-layer="3953" to-port="0" /> <edge from-layer="3953" from-port="1" to-layer="3954" to-port="1" /> <edge from-layer="3954" from-port="2" to-layer="3955" to-port="1" /> <edge from-layer="3955" from-port="2" to-layer="3956" to-port="1" /> <edge from-layer="3956" from-port="2" to-layer="3965" to-port="0" /> <edge from-layer="3956" from-port="2" to-layer="3995" to-port="0" /> <edge from-layer="3956" from-port="2" to-layer="4030" to-port="0" /> <edge from-layer="3957" from-port="0" to-layer="3958" to-port="0" /> <edge from-layer="3958" from-port="1" to-layer="3961" to-port="0" /> <edge from-layer="3959" from-port="0" to-layer="3960" to-port="0" /> <edge from-layer="3960" from-port="1" to-layer="3961" to-port="1" /> <edge from-layer="3961" from-port="2" to-layer="3963" to-port="0" /> <edge from-layer="3962" from-port="0" to-layer="3963" to-port="1" /> <edge from-layer="3963" from-port="2" to-layer="3964" to-port="0" /> <edge from-layer="3964" from-port="1" to-layer="3965" to-port="1" /> <edge from-layer="3965" from-port="2" to-layer="3967" to-port="0" /> <edge from-layer="3966" from-port="0" to-layer="3967" to-port="1" /> <edge from-layer="3967" from-port="2" to-layer="3969" to-port="0" /> <edge from-layer="3968" from-port="0" to-layer="3969" to-port="1" /> <edge from-layer="3969" from-port="2" to-layer="3970" to-port="0" /> <edge from-layer="3969" from-port="2" to-layer="3974" to-port="0" /> <edge from-layer="3969" from-port="2" to-layer="3980" to-port="0" /> <edge from-layer="3970" from-port="2" to-layer="3983" to-port="0" /> <edge from-layer="3971" from-port="0" to-layer="3974" to-port="1" /> <edge from-layer="3972" from-port="0" to-layer="3974" to-port="2" /> <edge from-layer="3973" from-port="0" to-layer="3974" to-port="3" /> <edge from-layer="3974" from-port="5" to-layer="3976" to-port="0" /> <edge from-layer="3975" from-port="0" to-layer="3976" to-port="1" /> <edge from-layer="3976" from-port="2" to-layer="3981" to-port="0" /> <edge from-layer="3977" from-port="0" to-layer="3980" to-port="1" /> <edge from-layer="3978" from-port="0" to-layer="3980" to-port="2" /> <edge from-layer="3979" from-port="0" to-layer="3980" to-port="3" /> <edge from-layer="3980" from-port="5" to-layer="3981" to-port="1" /> <edge from-layer="3981" from-port="2" to-layer="3982" to-port="0" /> <edge from-layer="3982" from-port="2" to-layer="3983" to-port="1" /> <edge from-layer="3983" from-port="2" to-layer="4040" to-port="0" /> <edge from-layer="3984" from-port="1" to-layer="3986" to-port="0" /> <edge from-layer="3985" from-port="0" to-layer="3986" to-port="2" /> <edge from-layer="3986" from-port="3" to-layer="4014" to-port="0" /> <edge from-layer="3987" from-port="0" to-layer="3988" to-port="0" /> <edge from-layer="3988" from-port="1" to-layer="3991" to-port="0" /> <edge from-layer="3989" from-port="0" to-layer="3990" to-port="0" /> <edge from-layer="3990" from-port="1" to-layer="3991" to-port="1" /> <edge from-layer="3991" from-port="2" to-layer="3993" to-port="0" /> <edge from-layer="3992" from-port="0" to-layer="3993" to-port="1" /> <edge from-layer="3993" from-port="2" to-layer="3994" to-port="0" /> <edge from-layer="3994" from-port="1" to-layer="3995" to-port="1" /> <edge from-layer="3995" from-port="2" to-layer="3997" to-port="0" /> <edge from-layer="3996" from-port="0" to-layer="3997" to-port="1" /> <edge from-layer="3997" from-port="2" to-layer="3999" to-port="0" /> <edge from-layer="3998" from-port="0" to-layer="3999" to-port="1" /> <edge from-layer="3999" from-port="2" to-layer="4010" to-port="0" /> <edge from-layer="3999" from-port="2" to-layer="4004" to-port="0" /> <edge from-layer="3999" from-port="2" to-layer="4000" to-port="0" /> <edge from-layer="4000" from-port="2" to-layer="4013" to-port="0" /> <edge from-layer="4001" from-port="0" to-layer="4004" to-port="1" /> <edge from-layer="4002" from-port="0" to-layer="4004" to-port="2" /> <edge from-layer="4003" from-port="0" to-layer="4004" to-port="3" /> <edge from-layer="4004" from-port="5" to-layer="4006" to-port="0" /> <edge from-layer="4005" from-port="0" to-layer="4006" to-port="1" /> <edge from-layer="4006" from-port="2" to-layer="4011" to-port="0" /> <edge from-layer="4007" from-port="0" to-layer="4010" to-port="1" /> <edge from-layer="4008" from-port="0" to-layer="4010" to-port="2" /> <edge from-layer="4009" from-port="0" to-layer="4010" to-port="3" /> <edge from-layer="4010" from-port="5" to-layer="4011" to-port="1" /> <edge from-layer="4011" from-port="2" to-layer="4012" to-port="0" /> <edge from-layer="4012" from-port="2" to-layer="4013" to-port="1" /> <edge from-layer="4013" from-port="2" to-layer="4014" to-port="1" /> <edge from-layer="4014" from-port="2" to-layer="6146" to-port="0" /> <edge from-layer="4014" from-port="2" to-layer="4015" to-port="0" /> <edge from-layer="4015" from-port="2" to-layer="4016" to-port="0" /> <edge from-layer="4016" from-port="2" to-layer="4018" to-port="0" /> <edge from-layer="4017" from-port="0" to-layer="4018" to-port="1" /> <edge from-layer="4018" from-port="2" to-layer="4040" to-port="1" /> <edge from-layer="4019" from-port="1" to-layer="4021" to-port="0" /> <edge from-layer="4020" from-port="0" to-layer="4021" to-port="2" /> <edge from-layer="4021" from-port="3" to-layer="4035" to-port="0" /> <edge from-layer="4022" from-port="0" to-layer="4023" to-port="0" /> <edge from-layer="4023" from-port="1" to-layer="4026" to-port="0" /> <edge from-layer="4024" from-port="0" to-layer="4025" to-port="0" /> <edge from-layer="4025" from-port="1" to-layer="4026" to-port="1" /> <edge from-layer="4026" from-port="2" to-layer="4028" to-port="0" /> <edge from-layer="4027" from-port="0" to-layer="4028" to-port="1" /> <edge from-layer="4028" from-port="2" to-layer="4029" to-port="0" /> <edge from-layer="4029" from-port="1" to-layer="4030" to-port="1" /> <edge from-layer="4030" from-port="2" to-layer="4032" to-port="0" /> <edge from-layer="4031" from-port="0" to-layer="4032" to-port="1" /> <edge from-layer="4032" from-port="2" to-layer="4034" to-port="0" /> <edge from-layer="4033" from-port="0" to-layer="4034" to-port="1" /> <edge from-layer="4034" from-port="2" to-layer="4035" to-port="1" /> <edge from-layer="4035" from-port="2" to-layer="6145" to-port="0" /> <edge from-layer="4035" from-port="2" to-layer="4036" to-port="0" /> <edge from-layer="4036" from-port="2" to-layer="4037" to-port="0" /> <edge from-layer="4037" from-port="2" to-layer="4039" to-port="0" /> <edge from-layer="4038" from-port="0" to-layer="4039" to-port="1" /> <edge from-layer="4039" from-port="2" to-layer="4040" to-port="2" /> <edge from-layer="4040" from-port="4" to-layer="4042" to-port="0" /> <edge from-layer="4041" from-port="0" to-layer="4042" to-port="1" /> <edge from-layer="4042" from-port="2" to-layer="4043" to-port="0" /> <edge from-layer="4043" from-port="2" to-layer="4052" to-port="0" /> <edge from-layer="4044" from-port="0" to-layer="4045" to-port="0" /> <edge from-layer="4045" from-port="1" to-layer="4048" to-port="0" /> <edge from-layer="4046" from-port="0" to-layer="4047" to-port="0" /> <edge from-layer="4047" from-port="1" to-layer="4048" to-port="1" /> <edge from-layer="4048" from-port="2" to-layer="4050" to-port="0" /> <edge from-layer="4049" from-port="0" to-layer="4050" to-port="1" /> <edge from-layer="4050" from-port="2" to-layer="4051" to-port="0" /> <edge from-layer="4051" from-port="1" to-layer="4052" to-port="1" /> <edge from-layer="4052" from-port="2" to-layer="4053" to-port="1" /> <edge from-layer="4053" from-port="2" to-layer="4064" to-port="0" /> <edge from-layer="4053" from-port="2" to-layer="4057" to-port="0" /> <edge from-layer="4053" from-port="2" to-layer="4095" to-port="0" /> <edge from-layer="4054" from-port="0" to-layer="4065" to-port="0" /> <edge from-layer="4055" from-port="0" to-layer="4063" to-port="0" /> <edge from-layer="4056" from-port="0" to-layer="4057" to-port="1" /> <edge from-layer="4057" from-port="2" to-layer="4059" to-port="0" /> <edge from-layer="4058" from-port="0" to-layer="4059" to-port="1" /> <edge from-layer="4059" from-port="2" to-layer="4061" to-port="0" /> <edge from-layer="4060" from-port="0" to-layer="4061" to-port="1" /> <edge from-layer="4061" from-port="2" to-layer="4062" to-port="0" /> <edge from-layer="4062" from-port="1" to-layer="4063" to-port="1" /> <edge from-layer="4063" from-port="2" to-layer="4064" to-port="1" /> <edge from-layer="4064" from-port="2" to-layer="4065" to-port="1" /> <edge from-layer="4065" from-port="2" to-layer="4074" to-port="0" /> <edge from-layer="4065" from-port="2" to-layer="4084" to-port="0" /> <edge from-layer="4066" from-port="0" to-layer="4067" to-port="0" /> <edge from-layer="4067" from-port="1" to-layer="4070" to-port="0" /> <edge from-layer="4068" from-port="0" to-layer="4069" to-port="0" /> <edge from-layer="4069" from-port="1" to-layer="4070" to-port="1" /> <edge from-layer="4070" from-port="2" to-layer="4072" to-port="0" /> <edge from-layer="4071" from-port="0" to-layer="4072" to-port="1" /> <edge from-layer="4072" from-port="2" to-layer="4073" to-port="0" /> <edge from-layer="4073" from-port="1" to-layer="4074" to-port="1" /> <edge from-layer="4074" from-port="2" to-layer="4075" to-port="0" /> <edge from-layer="4075" from-port="1" to-layer="4085" to-port="0" /> <edge from-layer="4076" from-port="0" to-layer="4077" to-port="0" /> <edge from-layer="4077" from-port="1" to-layer="4080" to-port="0" /> <edge from-layer="4078" from-port="0" to-layer="4079" to-port="0" /> <edge from-layer="4079" from-port="1" to-layer="4080" to-port="1" /> <edge from-layer="4080" from-port="2" to-layer="4082" to-port="0" /> <edge from-layer="4081" from-port="0" to-layer="4082" to-port="1" /> <edge from-layer="4082" from-port="2" to-layer="4083" to-port="0" /> <edge from-layer="4083" from-port="1" to-layer="4084" to-port="1" /> <edge from-layer="4084" from-port="2" to-layer="4085" to-port="1" /> <edge from-layer="4085" from-port="2" to-layer="4094" to-port="0" /> <edge from-layer="4086" from-port="0" to-layer="4087" to-port="0" /> <edge from-layer="4087" from-port="1" to-layer="4090" to-port="0" /> <edge from-layer="4088" from-port="0" to-layer="4089" to-port="0" /> <edge from-layer="4089" from-port="1" to-layer="4090" to-port="1" /> <edge from-layer="4090" from-port="2" to-layer="4092" to-port="0" /> <edge from-layer="4091" from-port="0" to-layer="4092" to-port="1" /> <edge from-layer="4092" from-port="2" to-layer="4093" to-port="0" /> <edge from-layer="4093" from-port="1" to-layer="4094" to-port="1" /> <edge from-layer="4094" from-port="2" to-layer="4095" to-port="1" /> <edge from-layer="4095" from-port="2" to-layer="4106" to-port="0" /> <edge from-layer="4095" from-port="2" to-layer="4204" to-port="0" /> <edge from-layer="4095" from-port="2" to-layer="4099" to-port="0" /> <edge from-layer="4096" from-port="0" to-layer="4107" to-port="0" /> <edge from-layer="4097" from-port="0" to-layer="4105" to-port="0" /> <edge from-layer="4098" from-port="0" to-layer="4099" to-port="1" /> <edge from-layer="4099" from-port="2" to-layer="4101" to-port="0" /> <edge from-layer="4100" from-port="0" to-layer="4101" to-port="1" /> <edge from-layer="4101" from-port="2" to-layer="4103" to-port="0" /> <edge from-layer="4102" from-port="0" to-layer="4103" to-port="1" /> <edge from-layer="4103" from-port="2" to-layer="4104" to-port="0" /> <edge from-layer="4104" from-port="1" to-layer="4105" to-port="1" /> <edge from-layer="4105" from-port="2" to-layer="4106" to-port="1" /> <edge from-layer="4106" from-port="2" to-layer="4107" to-port="1" /> <edge from-layer="4107" from-port="2" to-layer="4116" to-port="0" /> <edge from-layer="4107" from-port="2" to-layer="4181" to-port="0" /> <edge from-layer="4107" from-port="2" to-layer="4146" to-port="0" /> <edge from-layer="4108" from-port="0" to-layer="4109" to-port="0" /> <edge from-layer="4109" from-port="1" to-layer="4112" to-port="0" /> <edge from-layer="4110" from-port="0" to-layer="4111" to-port="0" /> <edge from-layer="4111" from-port="1" to-layer="4112" to-port="1" /> <edge from-layer="4112" from-port="2" to-layer="4114" to-port="0" /> <edge from-layer="4113" from-port="0" to-layer="4114" to-port="1" /> <edge from-layer="4114" from-port="2" to-layer="4115" to-port="0" /> <edge from-layer="4115" from-port="1" to-layer="4116" to-port="1" /> <edge from-layer="4116" from-port="2" to-layer="4118" to-port="0" /> <edge from-layer="4117" from-port="0" to-layer="4118" to-port="1" /> <edge from-layer="4118" from-port="2" to-layer="4120" to-port="0" /> <edge from-layer="4119" from-port="0" to-layer="4120" to-port="1" /> <edge from-layer="4120" from-port="2" to-layer="4121" to-port="0" /> <edge from-layer="4120" from-port="2" to-layer="4125" to-port="0" /> <edge from-layer="4120" from-port="2" to-layer="4131" to-port="0" /> <edge from-layer="4121" from-port="2" to-layer="4134" to-port="0" /> <edge from-layer="4122" from-port="0" to-layer="4125" to-port="1" /> <edge from-layer="4123" from-port="0" to-layer="4125" to-port="2" /> <edge from-layer="4124" from-port="0" to-layer="4125" to-port="3" /> <edge from-layer="4125" from-port="5" to-layer="4127" to-port="0" /> <edge from-layer="4126" from-port="0" to-layer="4127" to-port="1" /> <edge from-layer="4127" from-port="2" to-layer="4132" to-port="0" /> <edge from-layer="4128" from-port="0" to-layer="4131" to-port="1" /> <edge from-layer="4129" from-port="0" to-layer="4131" to-port="2" /> <edge from-layer="4130" from-port="0" to-layer="4131" to-port="3" /> <edge from-layer="4131" from-port="5" to-layer="4132" to-port="1" /> <edge from-layer="4132" from-port="2" to-layer="4133" to-port="0" /> <edge from-layer="4133" from-port="2" to-layer="4134" to-port="1" /> <edge from-layer="4134" from-port="2" to-layer="4191" to-port="0" /> <edge from-layer="4135" from-port="1" to-layer="4137" to-port="0" /> <edge from-layer="4136" from-port="0" to-layer="4137" to-port="2" /> <edge from-layer="4137" from-port="3" to-layer="4165" to-port="0" /> <edge from-layer="4138" from-port="0" to-layer="4139" to-port="0" /> <edge from-layer="4139" from-port="1" to-layer="4142" to-port="0" /> <edge from-layer="4140" from-port="0" to-layer="4141" to-port="0" /> <edge from-layer="4141" from-port="1" to-layer="4142" to-port="1" /> <edge from-layer="4142" from-port="2" to-layer="4144" to-port="0" /> <edge from-layer="4143" from-port="0" to-layer="4144" to-port="1" /> <edge from-layer="4144" from-port="2" to-layer="4145" to-port="0" /> <edge from-layer="4145" from-port="1" to-layer="4146" to-port="1" /> <edge from-layer="4146" from-port="2" to-layer="4148" to-port="0" /> <edge from-layer="4147" from-port="0" to-layer="4148" to-port="1" /> <edge from-layer="4148" from-port="2" to-layer="4150" to-port="0" /> <edge from-layer="4149" from-port="0" to-layer="4150" to-port="1" /> <edge from-layer="4150" from-port="2" to-layer="4151" to-port="0" /> <edge from-layer="4150" from-port="2" to-layer="4155" to-port="0" /> <edge from-layer="4150" from-port="2" to-layer="4161" to-port="0" /> <edge from-layer="4151" from-port="2" to-layer="4164" to-port="0" /> <edge from-layer="4152" from-port="0" to-layer="4155" to-port="1" /> <edge from-layer="4153" from-port="0" to-layer="4155" to-port="2" /> <edge from-layer="4154" from-port="0" to-layer="4155" to-port="3" /> <edge from-layer="4155" from-port="5" to-layer="4157" to-port="0" /> <edge from-layer="4156" from-port="0" to-layer="4157" to-port="1" /> <edge from-layer="4157" from-port="2" to-layer="4162" to-port="0" /> <edge from-layer="4158" from-port="0" to-layer="4161" to-port="1" /> <edge from-layer="4159" from-port="0" to-layer="4161" to-port="2" /> <edge from-layer="4160" from-port="0" to-layer="4161" to-port="3" /> <edge from-layer="4161" from-port="5" to-layer="4162" to-port="1" /> <edge from-layer="4162" from-port="2" to-layer="4163" to-port="0" /> <edge from-layer="4163" from-port="2" to-layer="4164" to-port="1" /> <edge from-layer="4164" from-port="2" to-layer="4165" to-port="1" /> <edge from-layer="4165" from-port="2" to-layer="6144" to-port="0" /> <edge from-layer="4165" from-port="2" to-layer="4166" to-port="0" /> <edge from-layer="4166" from-port="2" to-layer="4167" to-port="0" /> <edge from-layer="4167" from-port="2" to-layer="4169" to-port="0" /> <edge from-layer="4168" from-port="0" to-layer="4169" to-port="1" /> <edge from-layer="4169" from-port="2" to-layer="4191" to-port="1" /> <edge from-layer="4170" from-port="1" to-layer="4172" to-port="0" /> <edge from-layer="4171" from-port="0" to-layer="4172" to-port="2" /> <edge from-layer="4172" from-port="3" to-layer="4186" to-port="0" /> <edge from-layer="4173" from-port="0" to-layer="4174" to-port="0" /> <edge from-layer="4174" from-port="1" to-layer="4177" to-port="0" /> <edge from-layer="4175" from-port="0" to-layer="4176" to-port="0" /> <edge from-layer="4176" from-port="1" to-layer="4177" to-port="1" /> <edge from-layer="4177" from-port="2" to-layer="4179" to-port="0" /> <edge from-layer="4178" from-port="0" to-layer="4179" to-port="1" /> <edge from-layer="4179" from-port="2" to-layer="4180" to-port="0" /> <edge from-layer="4180" from-port="1" to-layer="4181" to-port="1" /> <edge from-layer="4181" from-port="2" to-layer="4183" to-port="0" /> <edge from-layer="4182" from-port="0" to-layer="4183" to-port="1" /> <edge from-layer="4183" from-port="2" to-layer="4185" to-port="0" /> <edge from-layer="4184" from-port="0" to-layer="4185" to-port="1" /> <edge from-layer="4185" from-port="2" to-layer="4186" to-port="1" /> <edge from-layer="4186" from-port="2" to-layer="6143" to-port="0" /> <edge from-layer="4186" from-port="2" to-layer="4187" to-port="0" /> <edge from-layer="4187" from-port="2" to-layer="4188" to-port="0" /> <edge from-layer="4188" from-port="2" to-layer="4190" to-port="0" /> <edge from-layer="4189" from-port="0" to-layer="4190" to-port="1" /> <edge from-layer="4190" from-port="2" to-layer="4191" to-port="2" /> <edge from-layer="4191" from-port="4" to-layer="4193" to-port="0" /> <edge from-layer="4192" from-port="0" to-layer="4193" to-port="1" /> <edge from-layer="4193" from-port="2" to-layer="4194" to-port="0" /> <edge from-layer="4194" from-port="2" to-layer="4203" to-port="0" /> <edge from-layer="4195" from-port="0" to-layer="4196" to-port="0" /> <edge from-layer="4196" from-port="1" to-layer="4199" to-port="0" /> <edge from-layer="4197" from-port="0" to-layer="4198" to-port="0" /> <edge from-layer="4198" from-port="1" to-layer="4199" to-port="1" /> <edge from-layer="4199" from-port="2" to-layer="4201" to-port="0" /> <edge from-layer="4200" from-port="0" to-layer="4201" to-port="1" /> <edge from-layer="4201" from-port="2" to-layer="4202" to-port="0" /> <edge from-layer="4202" from-port="1" to-layer="4203" to-port="1" /> <edge from-layer="4203" from-port="2" to-layer="4204" to-port="1" /> <edge from-layer="4204" from-port="2" to-layer="4246" to-port="0" /> <edge from-layer="4204" from-port="2" to-layer="4215" to-port="0" /> <edge from-layer="4204" from-port="2" to-layer="4208" to-port="0" /> <edge from-layer="4205" from-port="0" to-layer="4216" to-port="0" /> <edge from-layer="4206" from-port="0" to-layer="4214" to-port="0" /> <edge from-layer="4207" from-port="0" to-layer="4208" to-port="1" /> <edge from-layer="4208" from-port="2" to-layer="4210" to-port="0" /> <edge from-layer="4209" from-port="0" to-layer="4210" to-port="1" /> <edge from-layer="4210" from-port="2" to-layer="4212" to-port="0" /> <edge from-layer="4211" from-port="0" to-layer="4212" to-port="1" /> <edge from-layer="4212" from-port="2" to-layer="4213" to-port="0" /> <edge from-layer="4213" from-port="1" to-layer="4214" to-port="1" /> <edge from-layer="4214" from-port="2" to-layer="4215" to-port="1" /> <edge from-layer="4215" from-port="2" to-layer="4216" to-port="1" /> <edge from-layer="4216" from-port="2" to-layer="4235" to-port="0" /> <edge from-layer="4216" from-port="2" to-layer="4225" to-port="0" /> <edge from-layer="4217" from-port="0" to-layer="4218" to-port="0" /> <edge from-layer="4218" from-port="1" to-layer="4221" to-port="0" /> <edge from-layer="4219" from-port="0" to-layer="4220" to-port="0" /> <edge from-layer="4220" from-port="1" to-layer="4221" to-port="1" /> <edge from-layer="4221" from-port="2" to-layer="4223" to-port="0" /> <edge from-layer="4222" from-port="0" to-layer="4223" to-port="1" /> <edge from-layer="4223" from-port="2" to-layer="4224" to-port="0" /> <edge from-layer="4224" from-port="1" to-layer="4225" to-port="1" /> <edge from-layer="4225" from-port="2" to-layer="4226" to-port="0" /> <edge from-layer="4226" from-port="1" to-layer="4236" to-port="0" /> <edge from-layer="4227" from-port="0" to-layer="4228" to-port="0" /> <edge from-layer="4228" from-port="1" to-layer="4231" to-port="0" /> <edge from-layer="4229" from-port="0" to-layer="4230" to-port="0" /> <edge from-layer="4230" from-port="1" to-layer="4231" to-port="1" /> <edge from-layer="4231" from-port="2" to-layer="4233" to-port="0" /> <edge from-layer="4232" from-port="0" to-layer="4233" to-port="1" /> <edge from-layer="4233" from-port="2" to-layer="4234" to-port="0" /> <edge from-layer="4234" from-port="1" to-layer="4235" to-port="1" /> <edge from-layer="4235" from-port="2" to-layer="4236" to-port="1" /> <edge from-layer="4236" from-port="2" to-layer="4245" to-port="0" /> <edge from-layer="4237" from-port="0" to-layer="4238" to-port="0" /> <edge from-layer="4238" from-port="1" to-layer="4241" to-port="0" /> <edge from-layer="4239" from-port="0" to-layer="4240" to-port="0" /> <edge from-layer="4240" from-port="1" to-layer="4241" to-port="1" /> <edge from-layer="4241" from-port="2" to-layer="4243" to-port="0" /> <edge from-layer="4242" from-port="0" to-layer="4243" to-port="1" /> <edge from-layer="4243" from-port="2" to-layer="4244" to-port="0" /> <edge from-layer="4244" from-port="1" to-layer="4245" to-port="1" /> <edge from-layer="4245" from-port="2" to-layer="4246" to-port="1" /> <edge from-layer="4246" from-port="2" to-layer="4250" to-port="0" /> <edge from-layer="4246" from-port="2" to-layer="4257" to-port="0" /> <edge from-layer="4246" from-port="2" to-layer="4355" to-port="0" /> <edge from-layer="4247" from-port="0" to-layer="4258" to-port="0" /> <edge from-layer="4248" from-port="0" to-layer="4256" to-port="0" /> <edge from-layer="4249" from-port="0" to-layer="4250" to-port="1" /> <edge from-layer="4250" from-port="2" to-layer="4252" to-port="0" /> <edge from-layer="4251" from-port="0" to-layer="4252" to-port="1" /> <edge from-layer="4252" from-port="2" to-layer="4254" to-port="0" /> <edge from-layer="4253" from-port="0" to-layer="4254" to-port="1" /> <edge from-layer="4254" from-port="2" to-layer="4255" to-port="0" /> <edge from-layer="4255" from-port="1" to-layer="4256" to-port="1" /> <edge from-layer="4256" from-port="2" to-layer="4257" to-port="1" /> <edge from-layer="4257" from-port="2" to-layer="4258" to-port="1" /> <edge from-layer="4258" from-port="2" to-layer="4267" to-port="0" /> <edge from-layer="4258" from-port="2" to-layer="4297" to-port="0" /> <edge from-layer="4258" from-port="2" to-layer="4332" to-port="0" /> <edge from-layer="4259" from-port="0" to-layer="4260" to-port="0" /> <edge from-layer="4260" from-port="1" to-layer="4263" to-port="0" /> <edge from-layer="4261" from-port="0" to-layer="4262" to-port="0" /> <edge from-layer="4262" from-port="1" to-layer="4263" to-port="1" /> <edge from-layer="4263" from-port="2" to-layer="4265" to-port="0" /> <edge from-layer="4264" from-port="0" to-layer="4265" to-port="1" /> <edge from-layer="4265" from-port="2" to-layer="4266" to-port="0" /> <edge from-layer="4266" from-port="1" to-layer="4267" to-port="1" /> <edge from-layer="4267" from-port="2" to-layer="4269" to-port="0" /> <edge from-layer="4268" from-port="0" to-layer="4269" to-port="1" /> <edge from-layer="4269" from-port="2" to-layer="4271" to-port="0" /> <edge from-layer="4270" from-port="0" to-layer="4271" to-port="1" /> <edge from-layer="4271" from-port="2" to-layer="4282" to-port="0" /> <edge from-layer="4271" from-port="2" to-layer="4276" to-port="0" /> <edge from-layer="4271" from-port="2" to-layer="4272" to-port="0" /> <edge from-layer="4272" from-port="2" to-layer="4285" to-port="0" /> <edge from-layer="4273" from-port="0" to-layer="4276" to-port="1" /> <edge from-layer="4274" from-port="0" to-layer="4276" to-port="2" /> <edge from-layer="4275" from-port="0" to-layer="4276" to-port="3" /> <edge from-layer="4276" from-port="5" to-layer="4278" to-port="0" /> <edge from-layer="4277" from-port="0" to-layer="4278" to-port="1" /> <edge from-layer="4278" from-port="2" to-layer="4283" to-port="0" /> <edge from-layer="4279" from-port="0" to-layer="4282" to-port="1" /> <edge from-layer="4280" from-port="0" to-layer="4282" to-port="2" /> <edge from-layer="4281" from-port="0" to-layer="4282" to-port="3" /> <edge from-layer="4282" from-port="5" to-layer="4283" to-port="1" /> <edge from-layer="4283" from-port="2" to-layer="4284" to-port="0" /> <edge from-layer="4284" from-port="2" to-layer="4285" to-port="1" /> <edge from-layer="4285" from-port="2" to-layer="4342" to-port="0" /> <edge from-layer="4286" from-port="1" to-layer="4288" to-port="0" /> <edge from-layer="4287" from-port="0" to-layer="4288" to-port="2" /> <edge from-layer="4288" from-port="3" to-layer="4316" to-port="0" /> <edge from-layer="4289" from-port="0" to-layer="4290" to-port="0" /> <edge from-layer="4290" from-port="1" to-layer="4293" to-port="0" /> <edge from-layer="4291" from-port="0" to-layer="4292" to-port="0" /> <edge from-layer="4292" from-port="1" to-layer="4293" to-port="1" /> <edge from-layer="4293" from-port="2" to-layer="4295" to-port="0" /> <edge from-layer="4294" from-port="0" to-layer="4295" to-port="1" /> <edge from-layer="4295" from-port="2" to-layer="4296" to-port="0" /> <edge from-layer="4296" from-port="1" to-layer="4297" to-port="1" /> <edge from-layer="4297" from-port="2" to-layer="4299" to-port="0" /> <edge from-layer="4298" from-port="0" to-layer="4299" to-port="1" /> <edge from-layer="4299" from-port="2" to-layer="4301" to-port="0" /> <edge from-layer="4300" from-port="0" to-layer="4301" to-port="1" /> <edge from-layer="4301" from-port="2" to-layer="4312" to-port="0" /> <edge from-layer="4301" from-port="2" to-layer="4306" to-port="0" /> <edge from-layer="4301" from-port="2" to-layer="4302" to-port="0" /> <edge from-layer="4302" from-port="2" to-layer="4315" to-port="0" /> <edge from-layer="4303" from-port="0" to-layer="4306" to-port="1" /> <edge from-layer="4304" from-port="0" to-layer="4306" to-port="2" /> <edge from-layer="4305" from-port="0" to-layer="4306" to-port="3" /> <edge from-layer="4306" from-port="5" to-layer="4308" to-port="0" /> <edge from-layer="4307" from-port="0" to-layer="4308" to-port="1" /> <edge from-layer="4308" from-port="2" to-layer="4313" to-port="0" /> <edge from-layer="4309" from-port="0" to-layer="4312" to-port="1" /> <edge from-layer="4310" from-port="0" to-layer="4312" to-port="2" /> <edge from-layer="4311" from-port="0" to-layer="4312" to-port="3" /> <edge from-layer="4312" from-port="5" to-layer="4313" to-port="1" /> <edge from-layer="4313" from-port="2" to-layer="4314" to-port="0" /> <edge from-layer="4314" from-port="2" to-layer="4315" to-port="1" /> <edge from-layer="4315" from-port="2" to-layer="4316" to-port="1" /> <edge from-layer="4316" from-port="2" to-layer="6142" to-port="0" /> <edge from-layer="4316" from-port="2" to-layer="4317" to-port="0" /> <edge from-layer="4317" from-port="2" to-layer="4318" to-port="0" /> <edge from-layer="4318" from-port="2" to-layer="4320" to-port="0" /> <edge from-layer="4319" from-port="0" to-layer="4320" to-port="1" /> <edge from-layer="4320" from-port="2" to-layer="4342" to-port="1" /> <edge from-layer="4321" from-port="1" to-layer="4323" to-port="0" /> <edge from-layer="4322" from-port="0" to-layer="4323" to-port="2" /> <edge from-layer="4323" from-port="3" to-layer="4337" to-port="0" /> <edge from-layer="4324" from-port="0" to-layer="4325" to-port="0" /> <edge from-layer="4325" from-port="1" to-layer="4328" to-port="0" /> <edge from-layer="4326" from-port="0" to-layer="4327" to-port="0" /> <edge from-layer="4327" from-port="1" to-layer="4328" to-port="1" /> <edge from-layer="4328" from-port="2" to-layer="4330" to-port="0" /> <edge from-layer="4329" from-port="0" to-layer="4330" to-port="1" /> <edge from-layer="4330" from-port="2" to-layer="4331" to-port="0" /> <edge from-layer="4331" from-port="1" to-layer="4332" to-port="1" /> <edge from-layer="4332" from-port="2" to-layer="4334" to-port="0" /> <edge from-layer="4333" from-port="0" to-layer="4334" to-port="1" /> <edge from-layer="4334" from-port="2" to-layer="4336" to-port="0" /> <edge from-layer="4335" from-port="0" to-layer="4336" to-port="1" /> <edge from-layer="4336" from-port="2" to-layer="4337" to-port="1" /> <edge from-layer="4337" from-port="2" to-layer="6141" to-port="0" /> <edge from-layer="4337" from-port="2" to-layer="4338" to-port="0" /> <edge from-layer="4338" from-port="2" to-layer="4339" to-port="0" /> <edge from-layer="4339" from-port="2" to-layer="4341" to-port="0" /> <edge from-layer="4340" from-port="0" to-layer="4341" to-port="1" /> <edge from-layer="4341" from-port="2" to-layer="4342" to-port="2" /> <edge from-layer="4342" from-port="4" to-layer="4344" to-port="0" /> <edge from-layer="4343" from-port="0" to-layer="4344" to-port="1" /> <edge from-layer="4344" from-port="2" to-layer="4345" to-port="0" /> <edge from-layer="4345" from-port="2" to-layer="4354" to-port="0" /> <edge from-layer="4346" from-port="0" to-layer="4347" to-port="0" /> <edge from-layer="4347" from-port="1" to-layer="4350" to-port="0" /> <edge from-layer="4348" from-port="0" to-layer="4349" to-port="0" /> <edge from-layer="4349" from-port="1" to-layer="4350" to-port="1" /> <edge from-layer="4350" from-port="2" to-layer="4352" to-port="0" /> <edge from-layer="4351" from-port="0" to-layer="4352" to-port="1" /> <edge from-layer="4352" from-port="2" to-layer="4353" to-port="0" /> <edge from-layer="4353" from-port="1" to-layer="4354" to-port="1" /> <edge from-layer="4354" from-port="2" to-layer="4355" to-port="1" /> <edge from-layer="4355" from-port="2" to-layer="4359" to-port="0" /> <edge from-layer="4355" from-port="2" to-layer="4397" to-port="0" /> <edge from-layer="4355" from-port="2" to-layer="4366" to-port="0" /> <edge from-layer="4356" from-port="0" to-layer="4367" to-port="0" /> <edge from-layer="4357" from-port="0" to-layer="4365" to-port="0" /> <edge from-layer="4358" from-port="0" to-layer="4359" to-port="1" /> <edge from-layer="4359" from-port="2" to-layer="4361" to-port="0" /> <edge from-layer="4360" from-port="0" to-layer="4361" to-port="1" /> <edge from-layer="4361" from-port="2" to-layer="4363" to-port="0" /> <edge from-layer="4362" from-port="0" to-layer="4363" to-port="1" /> <edge from-layer="4363" from-port="2" to-layer="4364" to-port="0" /> <edge from-layer="4364" from-port="1" to-layer="4365" to-port="1" /> <edge from-layer="4365" from-port="2" to-layer="4366" to-port="1" /> <edge from-layer="4366" from-port="2" to-layer="4367" to-port="1" /> <edge from-layer="4367" from-port="2" to-layer="4386" to-port="0" /> <edge from-layer="4367" from-port="2" to-layer="4376" to-port="0" /> <edge from-layer="4368" from-port="0" to-layer="4369" to-port="0" /> <edge from-layer="4369" from-port="1" to-layer="4372" to-port="0" /> <edge from-layer="4370" from-port="0" to-layer="4371" to-port="0" /> <edge from-layer="4371" from-port="1" to-layer="4372" to-port="1" /> <edge from-layer="4372" from-port="2" to-layer="4374" to-port="0" /> <edge from-layer="4373" from-port="0" to-layer="4374" to-port="1" /> <edge from-layer="4374" from-port="2" to-layer="4375" to-port="0" /> <edge from-layer="4375" from-port="1" to-layer="4376" to-port="1" /> <edge from-layer="4376" from-port="2" to-layer="4377" to-port="0" /> <edge from-layer="4377" from-port="1" to-layer="4387" to-port="0" /> <edge from-layer="4378" from-port="0" to-layer="4379" to-port="0" /> <edge from-layer="4379" from-port="1" to-layer="4382" to-port="0" /> <edge from-layer="4380" from-port="0" to-layer="4381" to-port="0" /> <edge from-layer="4381" from-port="1" to-layer="4382" to-port="1" /> <edge from-layer="4382" from-port="2" to-layer="4384" to-port="0" /> <edge from-layer="4383" from-port="0" to-layer="4384" to-port="1" /> <edge from-layer="4384" from-port="2" to-layer="4385" to-port="0" /> <edge from-layer="4385" from-port="1" to-layer="4386" to-port="1" /> <edge from-layer="4386" from-port="2" to-layer="4387" to-port="1" /> <edge from-layer="4387" from-port="2" to-layer="4396" to-port="0" /> <edge from-layer="4388" from-port="0" to-layer="4389" to-port="0" /> <edge from-layer="4389" from-port="1" to-layer="4392" to-port="0" /> <edge from-layer="4390" from-port="0" to-layer="4391" to-port="0" /> <edge from-layer="4391" from-port="1" to-layer="4392" to-port="1" /> <edge from-layer="4392" from-port="2" to-layer="4394" to-port="0" /> <edge from-layer="4393" from-port="0" to-layer="4394" to-port="1" /> <edge from-layer="4394" from-port="2" to-layer="4395" to-port="0" /> <edge from-layer="4395" from-port="1" to-layer="4396" to-port="1" /> <edge from-layer="4396" from-port="2" to-layer="4397" to-port="1" /> <edge from-layer="4397" from-port="2" to-layer="4506" to-port="0" /> <edge from-layer="4397" from-port="2" to-layer="4408" to-port="0" /> <edge from-layer="4397" from-port="2" to-layer="4401" to-port="0" /> <edge from-layer="4398" from-port="0" to-layer="4409" to-port="0" /> <edge from-layer="4399" from-port="0" to-layer="4407" to-port="0" /> <edge from-layer="4400" from-port="0" to-layer="4401" to-port="1" /> <edge from-layer="4401" from-port="2" to-layer="4403" to-port="0" /> <edge from-layer="4402" from-port="0" to-layer="4403" to-port="1" /> <edge from-layer="4403" from-port="2" to-layer="4405" to-port="0" /> <edge from-layer="4404" from-port="0" to-layer="4405" to-port="1" /> <edge from-layer="4405" from-port="2" to-layer="4406" to-port="0" /> <edge from-layer="4406" from-port="1" to-layer="4407" to-port="1" /> <edge from-layer="4407" from-port="2" to-layer="4408" to-port="1" /> <edge from-layer="4408" from-port="2" to-layer="4409" to-port="1" /> <edge from-layer="4409" from-port="2" to-layer="4483" to-port="0" /> <edge from-layer="4409" from-port="2" to-layer="4418" to-port="0" /> <edge from-layer="4409" from-port="2" to-layer="4448" to-port="0" /> <edge from-layer="4410" from-port="0" to-layer="4411" to-port="0" /> <edge from-layer="4411" from-port="1" to-layer="4414" to-port="0" /> <edge from-layer="4412" from-port="0" to-layer="4413" to-port="0" /> <edge from-layer="4413" from-port="1" to-layer="4414" to-port="1" /> <edge from-layer="4414" from-port="2" to-layer="4416" to-port="0" /> <edge from-layer="4415" from-port="0" to-layer="4416" to-port="1" /> <edge from-layer="4416" from-port="2" to-layer="4417" to-port="0" /> <edge from-layer="4417" from-port="1" to-layer="4418" to-port="1" /> <edge from-layer="4418" from-port="2" to-layer="4420" to-port="0" /> <edge from-layer="4419" from-port="0" to-layer="4420" to-port="1" /> <edge from-layer="4420" from-port="2" to-layer="4422" to-port="0" /> <edge from-layer="4421" from-port="0" to-layer="4422" to-port="1" /> <edge from-layer="4422" from-port="2" to-layer="4433" to-port="0" /> <edge from-layer="4422" from-port="2" to-layer="4423" to-port="0" /> <edge from-layer="4422" from-port="2" to-layer="4427" to-port="0" /> <edge from-layer="4423" from-port="2" to-layer="4436" to-port="0" /> <edge from-layer="4424" from-port="0" to-layer="4427" to-port="1" /> <edge from-layer="4425" from-port="0" to-layer="4427" to-port="2" /> <edge from-layer="4426" from-port="0" to-layer="4427" to-port="3" /> <edge from-layer="4427" from-port="5" to-layer="4429" to-port="0" /> <edge from-layer="4428" from-port="0" to-layer="4429" to-port="1" /> <edge from-layer="4429" from-port="2" to-layer="4434" to-port="0" /> <edge from-layer="4430" from-port="0" to-layer="4433" to-port="1" /> <edge from-layer="4431" from-port="0" to-layer="4433" to-port="2" /> <edge from-layer="4432" from-port="0" to-layer="4433" to-port="3" /> <edge from-layer="4433" from-port="5" to-layer="4434" to-port="1" /> <edge from-layer="4434" from-port="2" to-layer="4435" to-port="0" /> <edge from-layer="4435" from-port="2" to-layer="4436" to-port="1" /> <edge from-layer="4436" from-port="2" to-layer="4493" to-port="0" /> <edge from-layer="4437" from-port="1" to-layer="4439" to-port="0" /> <edge from-layer="4438" from-port="0" to-layer="4439" to-port="2" /> <edge from-layer="4439" from-port="3" to-layer="4467" to-port="0" /> <edge from-layer="4440" from-port="0" to-layer="4441" to-port="0" /> <edge from-layer="4441" from-port="1" to-layer="4444" to-port="0" /> <edge from-layer="4442" from-port="0" to-layer="4443" to-port="0" /> <edge from-layer="4443" from-port="1" to-layer="4444" to-port="1" /> <edge from-layer="4444" from-port="2" to-layer="4446" to-port="0" /> <edge from-layer="4445" from-port="0" to-layer="4446" to-port="1" /> <edge from-layer="4446" from-port="2" to-layer="4447" to-port="0" /> <edge from-layer="4447" from-port="1" to-layer="4448" to-port="1" /> <edge from-layer="4448" from-port="2" to-layer="4450" to-port="0" /> <edge from-layer="4449" from-port="0" to-layer="4450" to-port="1" /> <edge from-layer="4450" from-port="2" to-layer="4452" to-port="0" /> <edge from-layer="4451" from-port="0" to-layer="4452" to-port="1" /> <edge from-layer="4452" from-port="2" to-layer="4463" to-port="0" /> <edge from-layer="4452" from-port="2" to-layer="4453" to-port="0" /> <edge from-layer="4452" from-port="2" to-layer="4457" to-port="0" /> <edge from-layer="4453" from-port="2" to-layer="4466" to-port="0" /> <edge from-layer="4454" from-port="0" to-layer="4457" to-port="1" /> <edge from-layer="4455" from-port="0" to-layer="4457" to-port="2" /> <edge from-layer="4456" from-port="0" to-layer="4457" to-port="3" /> <edge from-layer="4457" from-port="5" to-layer="4459" to-port="0" /> <edge from-layer="4458" from-port="0" to-layer="4459" to-port="1" /> <edge from-layer="4459" from-port="2" to-layer="4464" to-port="0" /> <edge from-layer="4460" from-port="0" to-layer="4463" to-port="1" /> <edge from-layer="4461" from-port="0" to-layer="4463" to-port="2" /> <edge from-layer="4462" from-port="0" to-layer="4463" to-port="3" /> <edge from-layer="4463" from-port="5" to-layer="4464" to-port="1" /> <edge from-layer="4464" from-port="2" to-layer="4465" to-port="0" /> <edge from-layer="4465" from-port="2" to-layer="4466" to-port="1" /> <edge from-layer="4466" from-port="2" to-layer="4467" to-port="1" /> <edge from-layer="4467" from-port="2" to-layer="6140" to-port="0" /> <edge from-layer="4467" from-port="2" to-layer="4468" to-port="0" /> <edge from-layer="4468" from-port="2" to-layer="4469" to-port="0" /> <edge from-layer="4469" from-port="2" to-layer="4471" to-port="0" /> <edge from-layer="4470" from-port="0" to-layer="4471" to-port="1" /> <edge from-layer="4471" from-port="2" to-layer="4493" to-port="1" /> <edge from-layer="4472" from-port="1" to-layer="4474" to-port="0" /> <edge from-layer="4473" from-port="0" to-layer="4474" to-port="2" /> <edge from-layer="4474" from-port="3" to-layer="4488" to-port="0" /> <edge from-layer="4475" from-port="0" to-layer="4476" to-port="0" /> <edge from-layer="4476" from-port="1" to-layer="4479" to-port="0" /> <edge from-layer="4477" from-port="0" to-layer="4478" to-port="0" /> <edge from-layer="4478" from-port="1" to-layer="4479" to-port="1" /> <edge from-layer="4479" from-port="2" to-layer="4481" to-port="0" /> <edge from-layer="4480" from-port="0" to-layer="4481" to-port="1" /> <edge from-layer="4481" from-port="2" to-layer="4482" to-port="0" /> <edge from-layer="4482" from-port="1" to-layer="4483" to-port="1" /> <edge from-layer="4483" from-port="2" to-layer="4485" to-port="0" /> <edge from-layer="4484" from-port="0" to-layer="4485" to-port="1" /> <edge from-layer="4485" from-port="2" to-layer="4487" to-port="0" /> <edge from-layer="4486" from-port="0" to-layer="4487" to-port="1" /> <edge from-layer="4487" from-port="2" to-layer="4488" to-port="1" /> <edge from-layer="4488" from-port="2" to-layer="4489" to-port="0" /> <edge from-layer="4488" from-port="2" to-layer="6139" to-port="0" /> <edge from-layer="4489" from-port="2" to-layer="4490" to-port="0" /> <edge from-layer="4490" from-port="2" to-layer="4492" to-port="0" /> <edge from-layer="4491" from-port="0" to-layer="4492" to-port="1" /> <edge from-layer="4492" from-port="2" to-layer="4493" to-port="2" /> <edge from-layer="4493" from-port="4" to-layer="4495" to-port="0" /> <edge from-layer="4494" from-port="0" to-layer="4495" to-port="1" /> <edge from-layer="4495" from-port="2" to-layer="4496" to-port="0" /> <edge from-layer="4496" from-port="2" to-layer="4505" to-port="0" /> <edge from-layer="4497" from-port="0" to-layer="4498" to-port="0" /> <edge from-layer="4498" from-port="1" to-layer="4501" to-port="0" /> <edge from-layer="4499" from-port="0" to-layer="4500" to-port="0" /> <edge from-layer="4500" from-port="1" to-layer="4501" to-port="1" /> <edge from-layer="4501" from-port="2" to-layer="4503" to-port="0" /> <edge from-layer="4502" from-port="0" to-layer="4503" to-port="1" /> <edge from-layer="4503" from-port="2" to-layer="4504" to-port="0" /> <edge from-layer="4504" from-port="1" to-layer="4505" to-port="1" /> <edge from-layer="4505" from-port="2" to-layer="4506" to-port="1" /> <edge from-layer="4506" from-port="2" to-layer="4510" to-port="0" /> <edge from-layer="4506" from-port="2" to-layer="4517" to-port="0" /> <edge from-layer="4506" from-port="2" to-layer="4548" to-port="0" /> <edge from-layer="4507" from-port="0" to-layer="4518" to-port="0" /> <edge from-layer="4508" from-port="0" to-layer="4516" to-port="0" /> <edge from-layer="4509" from-port="0" to-layer="4510" to-port="1" /> <edge from-layer="4510" from-port="2" to-layer="4512" to-port="0" /> <edge from-layer="4511" from-port="0" to-layer="4512" to-port="1" /> <edge from-layer="4512" from-port="2" to-layer="4514" to-port="0" /> <edge from-layer="4513" from-port="0" to-layer="4514" to-port="1" /> <edge from-layer="4514" from-port="2" to-layer="4515" to-port="0" /> <edge from-layer="4515" from-port="1" to-layer="4516" to-port="1" /> <edge from-layer="4516" from-port="2" to-layer="4517" to-port="1" /> <edge from-layer="4517" from-port="2" to-layer="4518" to-port="1" /> <edge from-layer="4518" from-port="2" to-layer="4537" to-port="0" /> <edge from-layer="4518" from-port="2" to-layer="4527" to-port="0" /> <edge from-layer="4519" from-port="0" to-layer="4520" to-port="0" /> <edge from-layer="4520" from-port="1" to-layer="4523" to-port="0" /> <edge from-layer="4521" from-port="0" to-layer="4522" to-port="0" /> <edge from-layer="4522" from-port="1" to-layer="4523" to-port="1" /> <edge from-layer="4523" from-port="2" to-layer="4525" to-port="0" /> <edge from-layer="4524" from-port="0" to-layer="4525" to-port="1" /> <edge from-layer="4525" from-port="2" to-layer="4526" to-port="0" /> <edge from-layer="4526" from-port="1" to-layer="4527" to-port="1" /> <edge from-layer="4527" from-port="2" to-layer="4528" to-port="0" /> <edge from-layer="4528" from-port="1" to-layer="4538" to-port="0" /> <edge from-layer="4529" from-port="0" to-layer="4530" to-port="0" /> <edge from-layer="4530" from-port="1" to-layer="4533" to-port="0" /> <edge from-layer="4531" from-port="0" to-layer="4532" to-port="0" /> <edge from-layer="4532" from-port="1" to-layer="4533" to-port="1" /> <edge from-layer="4533" from-port="2" to-layer="4535" to-port="0" /> <edge from-layer="4534" from-port="0" to-layer="4535" to-port="1" /> <edge from-layer="4535" from-port="2" to-layer="4536" to-port="0" /> <edge from-layer="4536" from-port="1" to-layer="4537" to-port="1" /> <edge from-layer="4537" from-port="2" to-layer="4538" to-port="1" /> <edge from-layer="4538" from-port="2" to-layer="4547" to-port="0" /> <edge from-layer="4539" from-port="0" to-layer="4540" to-port="0" /> <edge from-layer="4540" from-port="1" to-layer="4543" to-port="0" /> <edge from-layer="4541" from-port="0" to-layer="4542" to-port="0" /> <edge from-layer="4542" from-port="1" to-layer="4543" to-port="1" /> <edge from-layer="4543" from-port="2" to-layer="4545" to-port="0" /> <edge from-layer="4544" from-port="0" to-layer="4545" to-port="1" /> <edge from-layer="4545" from-port="2" to-layer="4546" to-port="0" /> <edge from-layer="4546" from-port="1" to-layer="4547" to-port="1" /> <edge from-layer="4547" from-port="2" to-layer="4548" to-port="1" /> <edge from-layer="4548" from-port="2" to-layer="4552" to-port="0" /> <edge from-layer="4548" from-port="2" to-layer="4657" to-port="0" /> <edge from-layer="4548" from-port="2" to-layer="4559" to-port="0" /> <edge from-layer="4549" from-port="0" to-layer="4560" to-port="0" /> <edge from-layer="4550" from-port="0" to-layer="4558" to-port="0" /> <edge from-layer="4551" from-port="0" to-layer="4552" to-port="1" /> <edge from-layer="4552" from-port="2" to-layer="4554" to-port="0" /> <edge from-layer="4553" from-port="0" to-layer="4554" to-port="1" /> <edge from-layer="4554" from-port="2" to-layer="4556" to-port="0" /> <edge from-layer="4555" from-port="0" to-layer="4556" to-port="1" /> <edge from-layer="4556" from-port="2" to-layer="4557" to-port="0" /> <edge from-layer="4557" from-port="1" to-layer="4558" to-port="1" /> <edge from-layer="4558" from-port="2" to-layer="4559" to-port="1" /> <edge from-layer="4559" from-port="2" to-layer="4560" to-port="1" /> <edge from-layer="4560" from-port="2" to-layer="4599" to-port="0" /> <edge from-layer="4560" from-port="2" to-layer="4634" to-port="0" /> <edge from-layer="4560" from-port="2" to-layer="4569" to-port="0" /> <edge from-layer="4561" from-port="0" to-layer="4562" to-port="0" /> <edge from-layer="4562" from-port="1" to-layer="4565" to-port="0" /> <edge from-layer="4563" from-port="0" to-layer="4564" to-port="0" /> <edge from-layer="4564" from-port="1" to-layer="4565" to-port="1" /> <edge from-layer="4565" from-port="2" to-layer="4567" to-port="0" /> <edge from-layer="4566" from-port="0" to-layer="4567" to-port="1" /> <edge from-layer="4567" from-port="2" to-layer="4568" to-port="0" /> <edge from-layer="4568" from-port="1" to-layer="4569" to-port="1" /> <edge from-layer="4569" from-port="2" to-layer="4571" to-port="0" /> <edge from-layer="4570" from-port="0" to-layer="4571" to-port="1" /> <edge from-layer="4571" from-port="2" to-layer="4573" to-port="0" /> <edge from-layer="4572" from-port="0" to-layer="4573" to-port="1" /> <edge from-layer="4573" from-port="2" to-layer="4574" to-port="0" /> <edge from-layer="4573" from-port="2" to-layer="4584" to-port="0" /> <edge from-layer="4573" from-port="2" to-layer="4578" to-port="0" /> <edge from-layer="4574" from-port="2" to-layer="4587" to-port="0" /> <edge from-layer="4575" from-port="0" to-layer="4578" to-port="1" /> <edge from-layer="4576" from-port="0" to-layer="4578" to-port="2" /> <edge from-layer="4577" from-port="0" to-layer="4578" to-port="3" /> <edge from-layer="4578" from-port="5" to-layer="4580" to-port="0" /> <edge from-layer="4579" from-port="0" to-layer="4580" to-port="1" /> <edge from-layer="4580" from-port="2" to-layer="4585" to-port="0" /> <edge from-layer="4581" from-port="0" to-layer="4584" to-port="1" /> <edge from-layer="4582" from-port="0" to-layer="4584" to-port="2" /> <edge from-layer="4583" from-port="0" to-layer="4584" to-port="3" /> <edge from-layer="4584" from-port="5" to-layer="4585" to-port="1" /> <edge from-layer="4585" from-port="2" to-layer="4586" to-port="0" /> <edge from-layer="4586" from-port="2" to-layer="4587" to-port="1" /> <edge from-layer="4587" from-port="2" to-layer="4644" to-port="0" /> <edge from-layer="4588" from-port="1" to-layer="4590" to-port="0" /> <edge from-layer="4589" from-port="0" to-layer="4590" to-port="2" /> <edge from-layer="4590" from-port="3" to-layer="4618" to-port="0" /> <edge from-layer="4591" from-port="0" to-layer="4592" to-port="0" /> <edge from-layer="4592" from-port="1" to-layer="4595" to-port="0" /> <edge from-layer="4593" from-port="0" to-layer="4594" to-port="0" /> <edge from-layer="4594" from-port="1" to-layer="4595" to-port="1" /> <edge from-layer="4595" from-port="2" to-layer="4597" to-port="0" /> <edge from-layer="4596" from-port="0" to-layer="4597" to-port="1" /> <edge from-layer="4597" from-port="2" to-layer="4598" to-port="0" /> <edge from-layer="4598" from-port="1" to-layer="4599" to-port="1" /> <edge from-layer="4599" from-port="2" to-layer="4601" to-port="0" /> <edge from-layer="4600" from-port="0" to-layer="4601" to-port="1" /> <edge from-layer="4601" from-port="2" to-layer="4603" to-port="0" /> <edge from-layer="4602" from-port="0" to-layer="4603" to-port="1" /> <edge from-layer="4603" from-port="2" to-layer="4614" to-port="0" /> <edge from-layer="4603" from-port="2" to-layer="4604" to-port="0" /> <edge from-layer="4603" from-port="2" to-layer="4608" to-port="0" /> <edge from-layer="4604" from-port="2" to-layer="4617" to-port="0" /> <edge from-layer="4605" from-port="0" to-layer="4608" to-port="1" /> <edge from-layer="4606" from-port="0" to-layer="4608" to-port="2" /> <edge from-layer="4607" from-port="0" to-layer="4608" to-port="3" /> <edge from-layer="4608" from-port="5" to-layer="4610" to-port="0" /> <edge from-layer="4609" from-port="0" to-layer="4610" to-port="1" /> <edge from-layer="4610" from-port="2" to-layer="4615" to-port="0" /> <edge from-layer="4611" from-port="0" to-layer="4614" to-port="1" /> <edge from-layer="4612" from-port="0" to-layer="4614" to-port="2" /> <edge from-layer="4613" from-port="0" to-layer="4614" to-port="3" /> <edge from-layer="4614" from-port="5" to-layer="4615" to-port="1" /> <edge from-layer="4615" from-port="2" to-layer="4616" to-port="0" /> <edge from-layer="4616" from-port="2" to-layer="4617" to-port="1" /> <edge from-layer="4617" from-port="2" to-layer="4618" to-port="1" /> <edge from-layer="4618" from-port="2" to-layer="6138" to-port="0" /> <edge from-layer="4618" from-port="2" to-layer="4619" to-port="0" /> <edge from-layer="4619" from-port="2" to-layer="4620" to-port="0" /> <edge from-layer="4620" from-port="2" to-layer="4622" to-port="0" /> <edge from-layer="4621" from-port="0" to-layer="4622" to-port="1" /> <edge from-layer="4622" from-port="2" to-layer="4644" to-port="1" /> <edge from-layer="4623" from-port="1" to-layer="4625" to-port="0" /> <edge from-layer="4624" from-port="0" to-layer="4625" to-port="2" /> <edge from-layer="4625" from-port="3" to-layer="4639" to-port="0" /> <edge from-layer="4626" from-port="0" to-layer="4627" to-port="0" /> <edge from-layer="4627" from-port="1" to-layer="4630" to-port="0" /> <edge from-layer="4628" from-port="0" to-layer="4629" to-port="0" /> <edge from-layer="4629" from-port="1" to-layer="4630" to-port="1" /> <edge from-layer="4630" from-port="2" to-layer="4632" to-port="0" /> <edge from-layer="4631" from-port="0" to-layer="4632" to-port="1" /> <edge from-layer="4632" from-port="2" to-layer="4633" to-port="0" /> <edge from-layer="4633" from-port="1" to-layer="4634" to-port="1" /> <edge from-layer="4634" from-port="2" to-layer="4636" to-port="0" /> <edge from-layer="4635" from-port="0" to-layer="4636" to-port="1" /> <edge from-layer="4636" from-port="2" to-layer="4638" to-port="0" /> <edge from-layer="4637" from-port="0" to-layer="4638" to-port="1" /> <edge from-layer="4638" from-port="2" to-layer="4639" to-port="1" /> <edge from-layer="4639" from-port="2" to-layer="4640" to-port="0" /> <edge from-layer="4639" from-port="2" to-layer="6137" to-port="0" /> <edge from-layer="4640" from-port="2" to-layer="4641" to-port="0" /> <edge from-layer="4641" from-port="2" to-layer="4643" to-port="0" /> <edge from-layer="4642" from-port="0" to-layer="4643" to-port="1" /> <edge from-layer="4643" from-port="2" to-layer="4644" to-port="2" /> <edge from-layer="4644" from-port="4" to-layer="4646" to-port="0" /> <edge from-layer="4645" from-port="0" to-layer="4646" to-port="1" /> <edge from-layer="4646" from-port="2" to-layer="4647" to-port="0" /> <edge from-layer="4647" from-port="2" to-layer="4656" to-port="0" /> <edge from-layer="4648" from-port="0" to-layer="4649" to-port="0" /> <edge from-layer="4649" from-port="1" to-layer="4652" to-port="0" /> <edge from-layer="4650" from-port="0" to-layer="4651" to-port="0" /> <edge from-layer="4651" from-port="1" to-layer="4652" to-port="1" /> <edge from-layer="4652" from-port="2" to-layer="4654" to-port="0" /> <edge from-layer="4653" from-port="0" to-layer="4654" to-port="1" /> <edge from-layer="4654" from-port="2" to-layer="4655" to-port="0" /> <edge from-layer="4655" from-port="1" to-layer="4656" to-port="1" /> <edge from-layer="4656" from-port="2" to-layer="4657" to-port="1" /> <edge from-layer="4657" from-port="2" to-layer="4661" to-port="0" /> <edge from-layer="4657" from-port="2" to-layer="4699" to-port="0" /> <edge from-layer="4657" from-port="2" to-layer="4668" to-port="0" /> <edge from-layer="4658" from-port="0" to-layer="4669" to-port="0" /> <edge from-layer="4659" from-port="0" to-layer="4667" to-port="0" /> <edge from-layer="4660" from-port="0" to-layer="4661" to-port="1" /> <edge from-layer="4661" from-port="2" to-layer="4663" to-port="0" /> <edge from-layer="4662" from-port="0" to-layer="4663" to-port="1" /> <edge from-layer="4663" from-port="2" to-layer="4665" to-port="0" /> <edge from-layer="4664" from-port="0" to-layer="4665" to-port="1" /> <edge from-layer="4665" from-port="2" to-layer="4666" to-port="0" /> <edge from-layer="4666" from-port="1" to-layer="4667" to-port="1" /> <edge from-layer="4667" from-port="2" to-layer="4668" to-port="1" /> <edge from-layer="4668" from-port="2" to-layer="4669" to-port="1" /> <edge from-layer="4669" from-port="2" to-layer="4678" to-port="0" /> <edge from-layer="4669" from-port="2" to-layer="4688" to-port="0" /> <edge from-layer="4670" from-port="0" to-layer="4671" to-port="0" /> <edge from-layer="4671" from-port="1" to-layer="4674" to-port="0" /> <edge from-layer="4672" from-port="0" to-layer="4673" to-port="0" /> <edge from-layer="4673" from-port="1" to-layer="4674" to-port="1" /> <edge from-layer="4674" from-port="2" to-layer="4676" to-port="0" /> <edge from-layer="4675" from-port="0" to-layer="4676" to-port="1" /> <edge from-layer="4676" from-port="2" to-layer="4677" to-port="0" /> <edge from-layer="4677" from-port="1" to-layer="4678" to-port="1" /> <edge from-layer="4678" from-port="2" to-layer="4679" to-port="0" /> <edge from-layer="4679" from-port="1" to-layer="4689" to-port="0" /> <edge from-layer="4680" from-port="0" to-layer="4681" to-port="0" /> <edge from-layer="4681" from-port="1" to-layer="4684" to-port="0" /> <edge from-layer="4682" from-port="0" to-layer="4683" to-port="0" /> <edge from-layer="4683" from-port="1" to-layer="4684" to-port="1" /> <edge from-layer="4684" from-port="2" to-layer="4686" to-port="0" /> <edge from-layer="4685" from-port="0" to-layer="4686" to-port="1" /> <edge from-layer="4686" from-port="2" to-layer="4687" to-port="0" /> <edge from-layer="4687" from-port="1" to-layer="4688" to-port="1" /> <edge from-layer="4688" from-port="2" to-layer="4689" to-port="1" /> <edge from-layer="4689" from-port="2" to-layer="4698" to-port="0" /> <edge from-layer="4690" from-port="0" to-layer="4691" to-port="0" /> <edge from-layer="4691" from-port="1" to-layer="4694" to-port="0" /> <edge from-layer="4692" from-port="0" to-layer="4693" to-port="0" /> <edge from-layer="4693" from-port="1" to-layer="4694" to-port="1" /> <edge from-layer="4694" from-port="2" to-layer="4696" to-port="0" /> <edge from-layer="4695" from-port="0" to-layer="4696" to-port="1" /> <edge from-layer="4696" from-port="2" to-layer="4697" to-port="0" /> <edge from-layer="4697" from-port="1" to-layer="4698" to-port="1" /> <edge from-layer="4698" from-port="2" to-layer="4699" to-port="1" /> <edge from-layer="4699" from-port="2" to-layer="4808" to-port="0" /> <edge from-layer="4699" from-port="2" to-layer="4703" to-port="0" /> <edge from-layer="4699" from-port="2" to-layer="4710" to-port="0" /> <edge from-layer="4700" from-port="0" to-layer="4711" to-port="0" /> <edge from-layer="4701" from-port="0" to-layer="4709" to-port="0" /> <edge from-layer="4702" from-port="0" to-layer="4703" to-port="1" /> <edge from-layer="4703" from-port="2" to-layer="4705" to-port="0" /> <edge from-layer="4704" from-port="0" to-layer="4705" to-port="1" /> <edge from-layer="4705" from-port="2" to-layer="4707" to-port="0" /> <edge from-layer="4706" from-port="0" to-layer="4707" to-port="1" /> <edge from-layer="4707" from-port="2" to-layer="4708" to-port="0" /> <edge from-layer="4708" from-port="1" to-layer="4709" to-port="1" /> <edge from-layer="4709" from-port="2" to-layer="4710" to-port="1" /> <edge from-layer="4710" from-port="2" to-layer="4711" to-port="1" /> <edge from-layer="4711" from-port="2" to-layer="4750" to-port="0" /> <edge from-layer="4711" from-port="2" to-layer="4785" to-port="0" /> <edge from-layer="4711" from-port="2" to-layer="4720" to-port="0" /> <edge from-layer="4712" from-port="0" to-layer="4713" to-port="0" /> <edge from-layer="4713" from-port="1" to-layer="4716" to-port="0" /> <edge from-layer="4714" from-port="0" to-layer="4715" to-port="0" /> <edge from-layer="4715" from-port="1" to-layer="4716" to-port="1" /> <edge from-layer="4716" from-port="2" to-layer="4718" to-port="0" /> <edge from-layer="4717" from-port="0" to-layer="4718" to-port="1" /> <edge from-layer="4718" from-port="2" to-layer="4719" to-port="0" /> <edge from-layer="4719" from-port="1" to-layer="4720" to-port="1" /> <edge from-layer="4720" from-port="2" to-layer="4722" to-port="0" /> <edge from-layer="4721" from-port="0" to-layer="4722" to-port="1" /> <edge from-layer="4722" from-port="2" to-layer="4724" to-port="0" /> <edge from-layer="4723" from-port="0" to-layer="4724" to-port="1" /> <edge from-layer="4724" from-port="2" to-layer="4725" to-port="0" /> <edge from-layer="4724" from-port="2" to-layer="4729" to-port="0" /> <edge from-layer="4724" from-port="2" to-layer="4735" to-port="0" /> <edge from-layer="4725" from-port="2" to-layer="4738" to-port="0" /> <edge from-layer="4726" from-port="0" to-layer="4729" to-port="1" /> <edge from-layer="4727" from-port="0" to-layer="4729" to-port="2" /> <edge from-layer="4728" from-port="0" to-layer="4729" to-port="3" /> <edge from-layer="4729" from-port="5" to-layer="4731" to-port="0" /> <edge from-layer="4730" from-port="0" to-layer="4731" to-port="1" /> <edge from-layer="4731" from-port="2" to-layer="4736" to-port="0" /> <edge from-layer="4732" from-port="0" to-layer="4735" to-port="1" /> <edge from-layer="4733" from-port="0" to-layer="4735" to-port="2" /> <edge from-layer="4734" from-port="0" to-layer="4735" to-port="3" /> <edge from-layer="4735" from-port="5" to-layer="4736" to-port="1" /> <edge from-layer="4736" from-port="2" to-layer="4737" to-port="0" /> <edge from-layer="4737" from-port="2" to-layer="4738" to-port="1" /> <edge from-layer="4738" from-port="2" to-layer="4795" to-port="0" /> <edge from-layer="4739" from-port="1" to-layer="4741" to-port="0" /> <edge from-layer="4740" from-port="0" to-layer="4741" to-port="2" /> <edge from-layer="4741" from-port="3" to-layer="4769" to-port="0" /> <edge from-layer="4742" from-port="0" to-layer="4743" to-port="0" /> <edge from-layer="4743" from-port="1" to-layer="4746" to-port="0" /> <edge from-layer="4744" from-port="0" to-layer="4745" to-port="0" /> <edge from-layer="4745" from-port="1" to-layer="4746" to-port="1" /> <edge from-layer="4746" from-port="2" to-layer="4748" to-port="0" /> <edge from-layer="4747" from-port="0" to-layer="4748" to-port="1" /> <edge from-layer="4748" from-port="2" to-layer="4749" to-port="0" /> <edge from-layer="4749" from-port="1" to-layer="4750" to-port="1" /> <edge from-layer="4750" from-port="2" to-layer="4752" to-port="0" /> <edge from-layer="4751" from-port="0" to-layer="4752" to-port="1" /> <edge from-layer="4752" from-port="2" to-layer="4754" to-port="0" /> <edge from-layer="4753" from-port="0" to-layer="4754" to-port="1" /> <edge from-layer="4754" from-port="2" to-layer="4755" to-port="0" /> <edge from-layer="4754" from-port="2" to-layer="4759" to-port="0" /> <edge from-layer="4754" from-port="2" to-layer="4765" to-port="0" /> <edge from-layer="4755" from-port="2" to-layer="4768" to-port="0" /> <edge from-layer="4756" from-port="0" to-layer="4759" to-port="1" /> <edge from-layer="4757" from-port="0" to-layer="4759" to-port="2" /> <edge from-layer="4758" from-port="0" to-layer="4759" to-port="3" /> <edge from-layer="4759" from-port="5" to-layer="4761" to-port="0" /> <edge from-layer="4760" from-port="0" to-layer="4761" to-port="1" /> <edge from-layer="4761" from-port="2" to-layer="4766" to-port="0" /> <edge from-layer="4762" from-port="0" to-layer="4765" to-port="1" /> <edge from-layer="4763" from-port="0" to-layer="4765" to-port="2" /> <edge from-layer="4764" from-port="0" to-layer="4765" to-port="3" /> <edge from-layer="4765" from-port="5" to-layer="4766" to-port="1" /> <edge from-layer="4766" from-port="2" to-layer="4767" to-port="0" /> <edge from-layer="4767" from-port="2" to-layer="4768" to-port="1" /> <edge from-layer="4768" from-port="2" to-layer="4769" to-port="1" /> <edge from-layer="4769" from-port="2" to-layer="6134" to-port="0" /> <edge from-layer="4769" from-port="2" to-layer="4770" to-port="0" /> <edge from-layer="4770" from-port="2" to-layer="4771" to-port="0" /> <edge from-layer="4771" from-port="2" to-layer="4773" to-port="0" /> <edge from-layer="4772" from-port="0" to-layer="4773" to-port="1" /> <edge from-layer="4773" from-port="2" to-layer="4795" to-port="1" /> <edge from-layer="4774" from-port="1" to-layer="4776" to-port="0" /> <edge from-layer="4775" from-port="0" to-layer="4776" to-port="2" /> <edge from-layer="4776" from-port="3" to-layer="4790" to-port="0" /> <edge from-layer="4777" from-port="0" to-layer="4778" to-port="0" /> <edge from-layer="4778" from-port="1" to-layer="4781" to-port="0" /> <edge from-layer="4779" from-port="0" to-layer="4780" to-port="0" /> <edge from-layer="4780" from-port="1" to-layer="4781" to-port="1" /> <edge from-layer="4781" from-port="2" to-layer="4783" to-port="0" /> <edge from-layer="4782" from-port="0" to-layer="4783" to-port="1" /> <edge from-layer="4783" from-port="2" to-layer="4784" to-port="0" /> <edge from-layer="4784" from-port="1" to-layer="4785" to-port="1" /> <edge from-layer="4785" from-port="2" to-layer="4787" to-port="0" /> <edge from-layer="4786" from-port="0" to-layer="4787" to-port="1" /> <edge from-layer="4787" from-port="2" to-layer="4789" to-port="0" /> <edge from-layer="4788" from-port="0" to-layer="4789" to-port="1" /> <edge from-layer="4789" from-port="2" to-layer="4790" to-port="1" /> <edge from-layer="4790" from-port="2" to-layer="4791" to-port="0" /> <edge from-layer="4790" from-port="2" to-layer="6133" to-port="0" /> <edge from-layer="4791" from-port="2" to-layer="4792" to-port="0" /> <edge from-layer="4792" from-port="2" to-layer="4794" to-port="0" /> <edge from-layer="4793" from-port="0" to-layer="4794" to-port="1" /> <edge from-layer="4794" from-port="2" to-layer="4795" to-port="2" /> <edge from-layer="4795" from-port="4" to-layer="4797" to-port="0" /> <edge from-layer="4796" from-port="0" to-layer="4797" to-port="1" /> <edge from-layer="4797" from-port="2" to-layer="4798" to-port="0" /> <edge from-layer="4798" from-port="2" to-layer="4807" to-port="0" /> <edge from-layer="4799" from-port="0" to-layer="4800" to-port="0" /> <edge from-layer="4800" from-port="1" to-layer="4803" to-port="0" /> <edge from-layer="4801" from-port="0" to-layer="4802" to-port="0" /> <edge from-layer="4802" from-port="1" to-layer="4803" to-port="1" /> <edge from-layer="4803" from-port="2" to-layer="4805" to-port="0" /> <edge from-layer="4804" from-port="0" to-layer="4805" to-port="1" /> <edge from-layer="4805" from-port="2" to-layer="4806" to-port="0" /> <edge from-layer="4806" from-port="1" to-layer="4807" to-port="1" /> <edge from-layer="4807" from-port="2" to-layer="4808" to-port="1" /> <edge from-layer="4808" from-port="2" to-layer="4812" to-port="0" /> <edge from-layer="4808" from-port="2" to-layer="4850" to-port="0" /> <edge from-layer="4808" from-port="2" to-layer="4819" to-port="0" /> <edge from-layer="4809" from-port="0" to-layer="4820" to-port="0" /> <edge from-layer="4810" from-port="0" to-layer="4818" to-port="0" /> <edge from-layer="4811" from-port="0" to-layer="4812" to-port="1" /> <edge from-layer="4812" from-port="2" to-layer="4814" to-port="0" /> <edge from-layer="4813" from-port="0" to-layer="4814" to-port="1" /> <edge from-layer="4814" from-port="2" to-layer="4816" to-port="0" /> <edge from-layer="4815" from-port="0" to-layer="4816" to-port="1" /> <edge from-layer="4816" from-port="2" to-layer="4817" to-port="0" /> <edge from-layer="4817" from-port="1" to-layer="4818" to-port="1" /> <edge from-layer="4818" from-port="2" to-layer="4819" to-port="1" /> <edge from-layer="4819" from-port="2" to-layer="4820" to-port="1" /> <edge from-layer="4820" from-port="2" to-layer="4839" to-port="0" /> <edge from-layer="4820" from-port="2" to-layer="4829" to-port="0" /> <edge from-layer="4821" from-port="0" to-layer="4822" to-port="0" /> <edge from-layer="4822" from-port="1" to-layer="4825" to-port="0" /> <edge from-layer="4823" from-port="0" to-layer="4824" to-port="0" /> <edge from-layer="4824" from-port="1" to-layer="4825" to-port="1" /> <edge from-layer="4825" from-port="2" to-layer="4827" to-port="0" /> <edge from-layer="4826" from-port="0" to-layer="4827" to-port="1" /> <edge from-layer="4827" from-port="2" to-layer="4828" to-port="0" /> <edge from-layer="4828" from-port="1" to-layer="4829" to-port="1" /> <edge from-layer="4829" from-port="2" to-layer="4830" to-port="0" /> <edge from-layer="4830" from-port="1" to-layer="4840" to-port="0" /> <edge from-layer="4831" from-port="0" to-layer="4832" to-port="0" /> <edge from-layer="4832" from-port="1" to-layer="4835" to-port="0" /> <edge from-layer="4833" from-port="0" to-layer="4834" to-port="0" /> <edge from-layer="4834" from-port="1" to-layer="4835" to-port="1" /> <edge from-layer="4835" from-port="2" to-layer="4837" to-port="0" /> <edge from-layer="4836" from-port="0" to-layer="4837" to-port="1" /> <edge from-layer="4837" from-port="2" to-layer="4838" to-port="0" /> <edge from-layer="4838" from-port="1" to-layer="4839" to-port="1" /> <edge from-layer="4839" from-port="2" to-layer="4840" to-port="1" /> <edge from-layer="4840" from-port="2" to-layer="4849" to-port="0" /> <edge from-layer="4841" from-port="0" to-layer="4842" to-port="0" /> <edge from-layer="4842" from-port="1" to-layer="4845" to-port="0" /> <edge from-layer="4843" from-port="0" to-layer="4844" to-port="0" /> <edge from-layer="4844" from-port="1" to-layer="4845" to-port="1" /> <edge from-layer="4845" from-port="2" to-layer="4847" to-port="0" /> <edge from-layer="4846" from-port="0" to-layer="4847" to-port="1" /> <edge from-layer="4847" from-port="2" to-layer="4848" to-port="0" /> <edge from-layer="4848" from-port="1" to-layer="4849" to-port="1" /> <edge from-layer="4849" from-port="2" to-layer="4850" to-port="1" /> <edge from-layer="4850" from-port="2" to-layer="4959" to-port="0" /> <edge from-layer="4850" from-port="2" to-layer="4854" to-port="0" /> <edge from-layer="4850" from-port="2" to-layer="4861" to-port="0" /> <edge from-layer="4851" from-port="0" to-layer="4862" to-port="0" /> <edge from-layer="4852" from-port="0" to-layer="4860" to-port="0" /> <edge from-layer="4853" from-port="0" to-layer="4854" to-port="1" /> <edge from-layer="4854" from-port="2" to-layer="4856" to-port="0" /> <edge from-layer="4855" from-port="0" to-layer="4856" to-port="1" /> <edge from-layer="4856" from-port="2" to-layer="4858" to-port="0" /> <edge from-layer="4857" from-port="0" to-layer="4858" to-port="1" /> <edge from-layer="4858" from-port="2" to-layer="4859" to-port="0" /> <edge from-layer="4859" from-port="1" to-layer="4860" to-port="1" /> <edge from-layer="4860" from-port="2" to-layer="4861" to-port="1" /> <edge from-layer="4861" from-port="2" to-layer="4862" to-port="1" /> <edge from-layer="4862" from-port="2" to-layer="4936" to-port="0" /> <edge from-layer="4862" from-port="2" to-layer="4871" to-port="0" /> <edge from-layer="4862" from-port="2" to-layer="4901" to-port="0" /> <edge from-layer="4863" from-port="0" to-layer="4864" to-port="0" /> <edge from-layer="4864" from-port="1" to-layer="4867" to-port="0" /> <edge from-layer="4865" from-port="0" to-layer="4866" to-port="0" /> <edge from-layer="4866" from-port="1" to-layer="4867" to-port="1" /> <edge from-layer="4867" from-port="2" to-layer="4869" to-port="0" /> <edge from-layer="4868" from-port="0" to-layer="4869" to-port="1" /> <edge from-layer="4869" from-port="2" to-layer="4870" to-port="0" /> <edge from-layer="4870" from-port="1" to-layer="4871" to-port="1" /> <edge from-layer="4871" from-port="2" to-layer="4873" to-port="0" /> <edge from-layer="4872" from-port="0" to-layer="4873" to-port="1" /> <edge from-layer="4873" from-port="2" to-layer="4875" to-port="0" /> <edge from-layer="4874" from-port="0" to-layer="4875" to-port="1" /> <edge from-layer="4875" from-port="2" to-layer="4876" to-port="0" /> <edge from-layer="4875" from-port="2" to-layer="4880" to-port="0" /> <edge from-layer="4875" from-port="2" to-layer="4886" to-port="0" /> <edge from-layer="4876" from-port="2" to-layer="4889" to-port="0" /> <edge from-layer="4877" from-port="0" to-layer="4880" to-port="1" /> <edge from-layer="4878" from-port="0" to-layer="4880" to-port="2" /> <edge from-layer="4879" from-port="0" to-layer="4880" to-port="3" /> <edge from-layer="4880" from-port="5" to-layer="4882" to-port="0" /> <edge from-layer="4881" from-port="0" to-layer="4882" to-port="1" /> <edge from-layer="4882" from-port="2" to-layer="4887" to-port="0" /> <edge from-layer="4883" from-port="0" to-layer="4886" to-port="1" /> <edge from-layer="4884" from-port="0" to-layer="4886" to-port="2" /> <edge from-layer="4885" from-port="0" to-layer="4886" to-port="3" /> <edge from-layer="4886" from-port="5" to-layer="4887" to-port="1" /> <edge from-layer="4887" from-port="2" to-layer="4888" to-port="0" /> <edge from-layer="4888" from-port="2" to-layer="4889" to-port="1" /> <edge from-layer="4889" from-port="2" to-layer="4946" to-port="0" /> <edge from-layer="4890" from-port="1" to-layer="4892" to-port="0" /> <edge from-layer="4891" from-port="0" to-layer="4892" to-port="2" /> <edge from-layer="4892" from-port="3" to-layer="4920" to-port="0" /> <edge from-layer="4893" from-port="0" to-layer="4894" to-port="0" /> <edge from-layer="4894" from-port="1" to-layer="4897" to-port="0" /> <edge from-layer="4895" from-port="0" to-layer="4896" to-port="0" /> <edge from-layer="4896" from-port="1" to-layer="4897" to-port="1" /> <edge from-layer="4897" from-port="2" to-layer="4899" to-port="0" /> <edge from-layer="4898" from-port="0" to-layer="4899" to-port="1" /> <edge from-layer="4899" from-port="2" to-layer="4900" to-port="0" /> <edge from-layer="4900" from-port="1" to-layer="4901" to-port="1" /> <edge from-layer="4901" from-port="2" to-layer="4903" to-port="0" /> <edge from-layer="4902" from-port="0" to-layer="4903" to-port="1" /> <edge from-layer="4903" from-port="2" to-layer="4905" to-port="0" /> <edge from-layer="4904" from-port="0" to-layer="4905" to-port="1" /> <edge from-layer="4905" from-port="2" to-layer="4916" to-port="0" /> <edge from-layer="4905" from-port="2" to-layer="4906" to-port="0" /> <edge from-layer="4905" from-port="2" to-layer="4910" to-port="0" /> <edge from-layer="4906" from-port="2" to-layer="4919" to-port="0" /> <edge from-layer="4907" from-port="0" to-layer="4910" to-port="1" /> <edge from-layer="4908" from-port="0" to-layer="4910" to-port="2" /> <edge from-layer="4909" from-port="0" to-layer="4910" to-port="3" /> <edge from-layer="4910" from-port="5" to-layer="4912" to-port="0" /> <edge from-layer="4911" from-port="0" to-layer="4912" to-port="1" /> <edge from-layer="4912" from-port="2" to-layer="4917" to-port="0" /> <edge from-layer="4913" from-port="0" to-layer="4916" to-port="1" /> <edge from-layer="4914" from-port="0" to-layer="4916" to-port="2" /> <edge from-layer="4915" from-port="0" to-layer="4916" to-port="3" /> <edge from-layer="4916" from-port="5" to-layer="4917" to-port="1" /> <edge from-layer="4917" from-port="2" to-layer="4918" to-port="0" /> <edge from-layer="4918" from-port="2" to-layer="4919" to-port="1" /> <edge from-layer="4919" from-port="2" to-layer="4920" to-port="1" /> <edge from-layer="4920" from-port="2" to-layer="6132" to-port="0" /> <edge from-layer="4920" from-port="2" to-layer="4921" to-port="0" /> <edge from-layer="4921" from-port="2" to-layer="4922" to-port="0" /> <edge from-layer="4922" from-port="2" to-layer="4924" to-port="0" /> <edge from-layer="4923" from-port="0" to-layer="4924" to-port="1" /> <edge from-layer="4924" from-port="2" to-layer="4946" to-port="1" /> <edge from-layer="4925" from-port="1" to-layer="4927" to-port="0" /> <edge from-layer="4926" from-port="0" to-layer="4927" to-port="2" /> <edge from-layer="4927" from-port="3" to-layer="4941" to-port="0" /> <edge from-layer="4928" from-port="0" to-layer="4929" to-port="0" /> <edge from-layer="4929" from-port="1" to-layer="4932" to-port="0" /> <edge from-layer="4930" from-port="0" to-layer="4931" to-port="0" /> <edge from-layer="4931" from-port="1" to-layer="4932" to-port="1" /> <edge from-layer="4932" from-port="2" to-layer="4934" to-port="0" /> <edge from-layer="4933" from-port="0" to-layer="4934" to-port="1" /> <edge from-layer="4934" from-port="2" to-layer="4935" to-port="0" /> <edge from-layer="4935" from-port="1" to-layer="4936" to-port="1" /> <edge from-layer="4936" from-port="2" to-layer="4938" to-port="0" /> <edge from-layer="4937" from-port="0" to-layer="4938" to-port="1" /> <edge from-layer="4938" from-port="2" to-layer="4940" to-port="0" /> <edge from-layer="4939" from-port="0" to-layer="4940" to-port="1" /> <edge from-layer="4940" from-port="2" to-layer="4941" to-port="1" /> <edge from-layer="4941" from-port="2" to-layer="6131" to-port="0" /> <edge from-layer="4941" from-port="2" to-layer="4942" to-port="0" /> <edge from-layer="4942" from-port="2" to-layer="4943" to-port="0" /> <edge from-layer="4943" from-port="2" to-layer="4945" to-port="0" /> <edge from-layer="4944" from-port="0" to-layer="4945" to-port="1" /> <edge from-layer="4945" from-port="2" to-layer="4946" to-port="2" /> <edge from-layer="4946" from-port="4" to-layer="4948" to-port="0" /> <edge from-layer="4947" from-port="0" to-layer="4948" to-port="1" /> <edge from-layer="4948" from-port="2" to-layer="4949" to-port="0" /> <edge from-layer="4949" from-port="2" to-layer="4958" to-port="0" /> <edge from-layer="4950" from-port="0" to-layer="4951" to-port="0" /> <edge from-layer="4951" from-port="1" to-layer="4954" to-port="0" /> <edge from-layer="4952" from-port="0" to-layer="4953" to-port="0" /> <edge from-layer="4953" from-port="1" to-layer="4954" to-port="1" /> <edge from-layer="4954" from-port="2" to-layer="4956" to-port="0" /> <edge from-layer="4955" from-port="0" to-layer="4956" to-port="1" /> <edge from-layer="4956" from-port="2" to-layer="4957" to-port="0" /> <edge from-layer="4957" from-port="1" to-layer="4958" to-port="1" /> <edge from-layer="4958" from-port="2" to-layer="4959" to-port="1" /> <edge from-layer="4959" from-port="2" to-layer="5001" to-port="0" /> <edge from-layer="4959" from-port="2" to-layer="4970" to-port="0" /> <edge from-layer="4959" from-port="2" to-layer="4963" to-port="0" /> <edge from-layer="4960" from-port="0" to-layer="4971" to-port="0" /> <edge from-layer="4961" from-port="0" to-layer="4969" to-port="0" /> <edge from-layer="4962" from-port="0" to-layer="4963" to-port="1" /> <edge from-layer="4963" from-port="2" to-layer="4965" to-port="0" /> <edge from-layer="4964" from-port="0" to-layer="4965" to-port="1" /> <edge from-layer="4965" from-port="2" to-layer="4967" to-port="0" /> <edge from-layer="4966" from-port="0" to-layer="4967" to-port="1" /> <edge from-layer="4967" from-port="2" to-layer="4968" to-port="0" /> <edge from-layer="4968" from-port="1" to-layer="4969" to-port="1" /> <edge from-layer="4969" from-port="2" to-layer="4970" to-port="1" /> <edge from-layer="4970" from-port="2" to-layer="4971" to-port="1" /> <edge from-layer="4971" from-port="2" to-layer="4990" to-port="0" /> <edge from-layer="4971" from-port="2" to-layer="4980" to-port="0" /> <edge from-layer="4972" from-port="0" to-layer="4973" to-port="0" /> <edge from-layer="4973" from-port="1" to-layer="4976" to-port="0" /> <edge from-layer="4974" from-port="0" to-layer="4975" to-port="0" /> <edge from-layer="4975" from-port="1" to-layer="4976" to-port="1" /> <edge from-layer="4976" from-port="2" to-layer="4978" to-port="0" /> <edge from-layer="4977" from-port="0" to-layer="4978" to-port="1" /> <edge from-layer="4978" from-port="2" to-layer="4979" to-port="0" /> <edge from-layer="4979" from-port="1" to-layer="4980" to-port="1" /> <edge from-layer="4980" from-port="2" to-layer="4981" to-port="0" /> <edge from-layer="4981" from-port="1" to-layer="4991" to-port="0" /> <edge from-layer="4982" from-port="0" to-layer="4983" to-port="0" /> <edge from-layer="4983" from-port="1" to-layer="4986" to-port="0" /> <edge from-layer="4984" from-port="0" to-layer="4985" to-port="0" /> <edge from-layer="4985" from-port="1" to-layer="4986" to-port="1" /> <edge from-layer="4986" from-port="2" to-layer="4988" to-port="0" /> <edge from-layer="4987" from-port="0" to-layer="4988" to-port="1" /> <edge from-layer="4988" from-port="2" to-layer="4989" to-port="0" /> <edge from-layer="4989" from-port="1" to-layer="4990" to-port="1" /> <edge from-layer="4990" from-port="2" to-layer="4991" to-port="1" /> <edge from-layer="4991" from-port="2" to-layer="5000" to-port="0" /> <edge from-layer="4992" from-port="0" to-layer="4993" to-port="0" /> <edge from-layer="4993" from-port="1" to-layer="4996" to-port="0" /> <edge from-layer="4994" from-port="0" to-layer="4995" to-port="0" /> <edge from-layer="4995" from-port="1" to-layer="4996" to-port="1" /> <edge from-layer="4996" from-port="2" to-layer="4998" to-port="0" /> <edge from-layer="4997" from-port="0" to-layer="4998" to-port="1" /> <edge from-layer="4998" from-port="2" to-layer="4999" to-port="0" /> <edge from-layer="4999" from-port="1" to-layer="5000" to-port="1" /> <edge from-layer="5000" from-port="2" to-layer="5001" to-port="1" /> <edge from-layer="5001" from-port="2" to-layer="5110" to-port="0" /> <edge from-layer="5001" from-port="2" to-layer="5012" to-port="0" /> <edge from-layer="5001" from-port="2" to-layer="5005" to-port="0" /> <edge from-layer="5002" from-port="0" to-layer="5013" to-port="0" /> <edge from-layer="5003" from-port="0" to-layer="5011" to-port="0" /> <edge from-layer="5004" from-port="0" to-layer="5005" to-port="1" /> <edge from-layer="5005" from-port="2" to-layer="5007" to-port="0" /> <edge from-layer="5006" from-port="0" to-layer="5007" to-port="1" /> <edge from-layer="5007" from-port="2" to-layer="5009" to-port="0" /> <edge from-layer="5008" from-port="0" to-layer="5009" to-port="1" /> <edge from-layer="5009" from-port="2" to-layer="5010" to-port="0" /> <edge from-layer="5010" from-port="1" to-layer="5011" to-port="1" /> <edge from-layer="5011" from-port="2" to-layer="5012" to-port="1" /> <edge from-layer="5012" from-port="2" to-layer="5013" to-port="1" /> <edge from-layer="5013" from-port="2" to-layer="5022" to-port="0" /> <edge from-layer="5013" from-port="2" to-layer="5052" to-port="0" /> <edge from-layer="5013" from-port="2" to-layer="5087" to-port="0" /> <edge from-layer="5014" from-port="0" to-layer="5015" to-port="0" /> <edge from-layer="5015" from-port="1" to-layer="5018" to-port="0" /> <edge from-layer="5016" from-port="0" to-layer="5017" to-port="0" /> <edge from-layer="5017" from-port="1" to-layer="5018" to-port="1" /> <edge from-layer="5018" from-port="2" to-layer="5020" to-port="0" /> <edge from-layer="5019" from-port="0" to-layer="5020" to-port="1" /> <edge from-layer="5020" from-port="2" to-layer="5021" to-port="0" /> <edge from-layer="5021" from-port="1" to-layer="5022" to-port="1" /> <edge from-layer="5022" from-port="2" to-layer="5024" to-port="0" /> <edge from-layer="5023" from-port="0" to-layer="5024" to-port="1" /> <edge from-layer="5024" from-port="2" to-layer="5026" to-port="0" /> <edge from-layer="5025" from-port="0" to-layer="5026" to-port="1" /> <edge from-layer="5026" from-port="2" to-layer="5027" to-port="0" /> <edge from-layer="5026" from-port="2" to-layer="5037" to-port="0" /> <edge from-layer="5026" from-port="2" to-layer="5031" to-port="0" /> <edge from-layer="5027" from-port="2" to-layer="5040" to-port="0" /> <edge from-layer="5028" from-port="0" to-layer="5031" to-port="1" /> <edge from-layer="5029" from-port="0" to-layer="5031" to-port="2" /> <edge from-layer="5030" from-port="0" to-layer="5031" to-port="3" /> <edge from-layer="5031" from-port="5" to-layer="5033" to-port="0" /> <edge from-layer="5032" from-port="0" to-layer="5033" to-port="1" /> <edge from-layer="5033" from-port="2" to-layer="5038" to-port="0" /> <edge from-layer="5034" from-port="0" to-layer="5037" to-port="1" /> <edge from-layer="5035" from-port="0" to-layer="5037" to-port="2" /> <edge from-layer="5036" from-port="0" to-layer="5037" to-port="3" /> <edge from-layer="5037" from-port="5" to-layer="5038" to-port="1" /> <edge from-layer="5038" from-port="2" to-layer="5039" to-port="0" /> <edge from-layer="5039" from-port="2" to-layer="5040" to-port="1" /> <edge from-layer="5040" from-port="2" to-layer="5097" to-port="0" /> <edge from-layer="5041" from-port="1" to-layer="5043" to-port="0" /> <edge from-layer="5042" from-port="0" to-layer="5043" to-port="2" /> <edge from-layer="5043" from-port="3" to-layer="5071" to-port="0" /> <edge from-layer="5044" from-port="0" to-layer="5045" to-port="0" /> <edge from-layer="5045" from-port="1" to-layer="5048" to-port="0" /> <edge from-layer="5046" from-port="0" to-layer="5047" to-port="0" /> <edge from-layer="5047" from-port="1" to-layer="5048" to-port="1" /> <edge from-layer="5048" from-port="2" to-layer="5050" to-port="0" /> <edge from-layer="5049" from-port="0" to-layer="5050" to-port="1" /> <edge from-layer="5050" from-port="2" to-layer="5051" to-port="0" /> <edge from-layer="5051" from-port="1" to-layer="5052" to-port="1" /> <edge from-layer="5052" from-port="2" to-layer="5054" to-port="0" /> <edge from-layer="5053" from-port="0" to-layer="5054" to-port="1" /> <edge from-layer="5054" from-port="2" to-layer="5056" to-port="0" /> <edge from-layer="5055" from-port="0" to-layer="5056" to-port="1" /> <edge from-layer="5056" from-port="2" to-layer="5061" to-port="0" /> <edge from-layer="5056" from-port="2" to-layer="5057" to-port="0" /> <edge from-layer="5056" from-port="2" to-layer="5067" to-port="0" /> <edge from-layer="5057" from-port="2" to-layer="5070" to-port="0" /> <edge from-layer="5058" from-port="0" to-layer="5061" to-port="1" /> <edge from-layer="5059" from-port="0" to-layer="5061" to-port="2" /> <edge from-layer="5060" from-port="0" to-layer="5061" to-port="3" /> <edge from-layer="5061" from-port="5" to-layer="5063" to-port="0" /> <edge from-layer="5062" from-port="0" to-layer="5063" to-port="1" /> <edge from-layer="5063" from-port="2" to-layer="5068" to-port="0" /> <edge from-layer="5064" from-port="0" to-layer="5067" to-port="1" /> <edge from-layer="5065" from-port="0" to-layer="5067" to-port="2" /> <edge from-layer="5066" from-port="0" to-layer="5067" to-port="3" /> <edge from-layer="5067" from-port="5" to-layer="5068" to-port="1" /> <edge from-layer="5068" from-port="2" to-layer="5069" to-port="0" /> <edge from-layer="5069" from-port="2" to-layer="5070" to-port="1" /> <edge from-layer="5070" from-port="2" to-layer="5071" to-port="1" /> <edge from-layer="5071" from-port="2" to-layer="6130" to-port="0" /> <edge from-layer="5071" from-port="2" to-layer="5072" to-port="0" /> <edge from-layer="5072" from-port="2" to-layer="5073" to-port="0" /> <edge from-layer="5073" from-port="2" to-layer="5075" to-port="0" /> <edge from-layer="5074" from-port="0" to-layer="5075" to-port="1" /> <edge from-layer="5075" from-port="2" to-layer="5097" to-port="1" /> <edge from-layer="5076" from-port="1" to-layer="5078" to-port="0" /> <edge from-layer="5077" from-port="0" to-layer="5078" to-port="2" /> <edge from-layer="5078" from-port="3" to-layer="5092" to-port="0" /> <edge from-layer="5079" from-port="0" to-layer="5080" to-port="0" /> <edge from-layer="5080" from-port="1" to-layer="5083" to-port="0" /> <edge from-layer="5081" from-port="0" to-layer="5082" to-port="0" /> <edge from-layer="5082" from-port="1" to-layer="5083" to-port="1" /> <edge from-layer="5083" from-port="2" to-layer="5085" to-port="0" /> <edge from-layer="5084" from-port="0" to-layer="5085" to-port="1" /> <edge from-layer="5085" from-port="2" to-layer="5086" to-port="0" /> <edge from-layer="5086" from-port="1" to-layer="5087" to-port="1" /> <edge from-layer="5087" from-port="2" to-layer="5089" to-port="0" /> <edge from-layer="5088" from-port="0" to-layer="5089" to-port="1" /> <edge from-layer="5089" from-port="2" to-layer="5091" to-port="0" /> <edge from-layer="5090" from-port="0" to-layer="5091" to-port="1" /> <edge from-layer="5091" from-port="2" to-layer="5092" to-port="1" /> <edge from-layer="5092" from-port="2" to-layer="5093" to-port="0" /> <edge from-layer="5092" from-port="2" to-layer="6129" to-port="0" /> <edge from-layer="5093" from-port="2" to-layer="5094" to-port="0" /> <edge from-layer="5094" from-port="2" to-layer="5096" to-port="0" /> <edge from-layer="5095" from-port="0" to-layer="5096" to-port="1" /> <edge from-layer="5096" from-port="2" to-layer="5097" to-port="2" /> <edge from-layer="5097" from-port="4" to-layer="5099" to-port="0" /> <edge from-layer="5098" from-port="0" to-layer="5099" to-port="1" /> <edge from-layer="5099" from-port="2" to-layer="5100" to-port="0" /> <edge from-layer="5100" from-port="2" to-layer="5109" to-port="0" /> <edge from-layer="5101" from-port="0" to-layer="5102" to-port="0" /> <edge from-layer="5102" from-port="1" to-layer="5105" to-port="0" /> <edge from-layer="5103" from-port="0" to-layer="5104" to-port="0" /> <edge from-layer="5104" from-port="1" to-layer="5105" to-port="1" /> <edge from-layer="5105" from-port="2" to-layer="5107" to-port="0" /> <edge from-layer="5106" from-port="0" to-layer="5107" to-port="1" /> <edge from-layer="5107" from-port="2" to-layer="5108" to-port="0" /> <edge from-layer="5108" from-port="1" to-layer="5109" to-port="1" /> <edge from-layer="5109" from-port="2" to-layer="5110" to-port="1" /> <edge from-layer="5110" from-port="2" to-layer="5152" to-port="0" /> <edge from-layer="5110" from-port="2" to-layer="5114" to-port="0" /> <edge from-layer="5110" from-port="2" to-layer="5121" to-port="0" /> <edge from-layer="5111" from-port="0" to-layer="5122" to-port="0" /> <edge from-layer="5112" from-port="0" to-layer="5120" to-port="0" /> <edge from-layer="5113" from-port="0" to-layer="5114" to-port="1" /> <edge from-layer="5114" from-port="2" to-layer="5116" to-port="0" /> <edge from-layer="5115" from-port="0" to-layer="5116" to-port="1" /> <edge from-layer="5116" from-port="2" to-layer="5118" to-port="0" /> <edge from-layer="5117" from-port="0" to-layer="5118" to-port="1" /> <edge from-layer="5118" from-port="2" to-layer="5119" to-port="0" /> <edge from-layer="5119" from-port="1" to-layer="5120" to-port="1" /> <edge from-layer="5120" from-port="2" to-layer="5121" to-port="1" /> <edge from-layer="5121" from-port="2" to-layer="5122" to-port="1" /> <edge from-layer="5122" from-port="2" to-layer="5131" to-port="0" /> <edge from-layer="5122" from-port="2" to-layer="5141" to-port="0" /> <edge from-layer="5123" from-port="0" to-layer="5124" to-port="0" /> <edge from-layer="5124" from-port="1" to-layer="5127" to-port="0" /> <edge from-layer="5125" from-port="0" to-layer="5126" to-port="0" /> <edge from-layer="5126" from-port="1" to-layer="5127" to-port="1" /> <edge from-layer="5127" from-port="2" to-layer="5129" to-port="0" /> <edge from-layer="5128" from-port="0" to-layer="5129" to-port="1" /> <edge from-layer="5129" from-port="2" to-layer="5130" to-port="0" /> <edge from-layer="5130" from-port="1" to-layer="5131" to-port="1" /> <edge from-layer="5131" from-port="2" to-layer="5132" to-port="0" /> <edge from-layer="5132" from-port="1" to-layer="5142" to-port="0" /> <edge from-layer="5133" from-port="0" to-layer="5134" to-port="0" /> <edge from-layer="5134" from-port="1" to-layer="5137" to-port="0" /> <edge from-layer="5135" from-port="0" to-layer="5136" to-port="0" /> <edge from-layer="5136" from-port="1" to-layer="5137" to-port="1" /> <edge from-layer="5137" from-port="2" to-layer="5139" to-port="0" /> <edge from-layer="5138" from-port="0" to-layer="5139" to-port="1" /> <edge from-layer="5139" from-port="2" to-layer="5140" to-port="0" /> <edge from-layer="5140" from-port="1" to-layer="5141" to-port="1" /> <edge from-layer="5141" from-port="2" to-layer="5142" to-port="1" /> <edge from-layer="5142" from-port="2" to-layer="5151" to-port="0" /> <edge from-layer="5143" from-port="0" to-layer="5144" to-port="0" /> <edge from-layer="5144" from-port="1" to-layer="5147" to-port="0" /> <edge from-layer="5145" from-port="0" to-layer="5146" to-port="0" /> <edge from-layer="5146" from-port="1" to-layer="5147" to-port="1" /> <edge from-layer="5147" from-port="2" to-layer="5149" to-port="0" /> <edge from-layer="5148" from-port="0" to-layer="5149" to-port="1" /> <edge from-layer="5149" from-port="2" to-layer="5150" to-port="0" /> <edge from-layer="5150" from-port="1" to-layer="5151" to-port="1" /> <edge from-layer="5151" from-port="2" to-layer="5152" to-port="1" /> <edge from-layer="5152" from-port="2" to-layer="5261" to-port="0" /> <edge from-layer="5152" from-port="2" to-layer="5156" to-port="0" /> <edge from-layer="5152" from-port="2" to-layer="5163" to-port="0" /> <edge from-layer="5153" from-port="0" to-layer="5164" to-port="0" /> <edge from-layer="5154" from-port="0" to-layer="5162" to-port="0" /> <edge from-layer="5155" from-port="0" to-layer="5156" to-port="1" /> <edge from-layer="5156" from-port="2" to-layer="5158" to-port="0" /> <edge from-layer="5157" from-port="0" to-layer="5158" to-port="1" /> <edge from-layer="5158" from-port="2" to-layer="5160" to-port="0" /> <edge from-layer="5159" from-port="0" to-layer="5160" to-port="1" /> <edge from-layer="5160" from-port="2" to-layer="5161" to-port="0" /> <edge from-layer="5161" from-port="1" to-layer="5162" to-port="1" /> <edge from-layer="5162" from-port="2" to-layer="5163" to-port="1" /> <edge from-layer="5163" from-port="2" to-layer="5164" to-port="1" /> <edge from-layer="5164" from-port="2" to-layer="5203" to-port="0" /> <edge from-layer="5164" from-port="2" to-layer="5173" to-port="0" /> <edge from-layer="5164" from-port="2" to-layer="5238" to-port="0" /> <edge from-layer="5165" from-port="0" to-layer="5166" to-port="0" /> <edge from-layer="5166" from-port="1" to-layer="5169" to-port="0" /> <edge from-layer="5167" from-port="0" to-layer="5168" to-port="0" /> <edge from-layer="5168" from-port="1" to-layer="5169" to-port="1" /> <edge from-layer="5169" from-port="2" to-layer="5171" to-port="0" /> <edge from-layer="5170" from-port="0" to-layer="5171" to-port="1" /> <edge from-layer="5171" from-port="2" to-layer="5172" to-port="0" /> <edge from-layer="5172" from-port="1" to-layer="5173" to-port="1" /> <edge from-layer="5173" from-port="2" to-layer="5175" to-port="0" /> <edge from-layer="5174" from-port="0" to-layer="5175" to-port="1" /> <edge from-layer="5175" from-port="2" to-layer="5177" to-port="0" /> <edge from-layer="5176" from-port="0" to-layer="5177" to-port="1" /> <edge from-layer="5177" from-port="2" to-layer="5188" to-port="0" /> <edge from-layer="5177" from-port="2" to-layer="5178" to-port="0" /> <edge from-layer="5177" from-port="2" to-layer="5182" to-port="0" /> <edge from-layer="5178" from-port="2" to-layer="5191" to-port="0" /> <edge from-layer="5179" from-port="0" to-layer="5182" to-port="1" /> <edge from-layer="5180" from-port="0" to-layer="5182" to-port="2" /> <edge from-layer="5181" from-port="0" to-layer="5182" to-port="3" /> <edge from-layer="5182" from-port="5" to-layer="5184" to-port="0" /> <edge from-layer="5183" from-port="0" to-layer="5184" to-port="1" /> <edge from-layer="5184" from-port="2" to-layer="5189" to-port="0" /> <edge from-layer="5185" from-port="0" to-layer="5188" to-port="1" /> <edge from-layer="5186" from-port="0" to-layer="5188" to-port="2" /> <edge from-layer="5187" from-port="0" to-layer="5188" to-port="3" /> <edge from-layer="5188" from-port="5" to-layer="5189" to-port="1" /> <edge from-layer="5189" from-port="2" to-layer="5190" to-port="0" /> <edge from-layer="5190" from-port="2" to-layer="5191" to-port="1" /> <edge from-layer="5191" from-port="2" to-layer="5248" to-port="0" /> <edge from-layer="5192" from-port="1" to-layer="5194" to-port="0" /> <edge from-layer="5193" from-port="0" to-layer="5194" to-port="2" /> <edge from-layer="5194" from-port="3" to-layer="5222" to-port="0" /> <edge from-layer="5195" from-port="0" to-layer="5196" to-port="0" /> <edge from-layer="5196" from-port="1" to-layer="5199" to-port="0" /> <edge from-layer="5197" from-port="0" to-layer="5198" to-port="0" /> <edge from-layer="5198" from-port="1" to-layer="5199" to-port="1" /> <edge from-layer="5199" from-port="2" to-layer="5201" to-port="0" /> <edge from-layer="5200" from-port="0" to-layer="5201" to-port="1" /> <edge from-layer="5201" from-port="2" to-layer="5202" to-port="0" /> <edge from-layer="5202" from-port="1" to-layer="5203" to-port="1" /> <edge from-layer="5203" from-port="2" to-layer="5205" to-port="0" /> <edge from-layer="5204" from-port="0" to-layer="5205" to-port="1" /> <edge from-layer="5205" from-port="2" to-layer="5207" to-port="0" /> <edge from-layer="5206" from-port="0" to-layer="5207" to-port="1" /> <edge from-layer="5207" from-port="2" to-layer="5212" to-port="0" /> <edge from-layer="5207" from-port="2" to-layer="5208" to-port="0" /> <edge from-layer="5207" from-port="2" to-layer="5218" to-port="0" /> <edge from-layer="5208" from-port="2" to-layer="5221" to-port="0" /> <edge from-layer="5209" from-port="0" to-layer="5212" to-port="1" /> <edge from-layer="5210" from-port="0" to-layer="5212" to-port="2" /> <edge from-layer="5211" from-port="0" to-layer="5212" to-port="3" /> <edge from-layer="5212" from-port="5" to-layer="5214" to-port="0" /> <edge from-layer="5213" from-port="0" to-layer="5214" to-port="1" /> <edge from-layer="5214" from-port="2" to-layer="5219" to-port="0" /> <edge from-layer="5215" from-port="0" to-layer="5218" to-port="1" /> <edge from-layer="5216" from-port="0" to-layer="5218" to-port="2" /> <edge from-layer="5217" from-port="0" to-layer="5218" to-port="3" /> <edge from-layer="5218" from-port="5" to-layer="5219" to-port="1" /> <edge from-layer="5219" from-port="2" to-layer="5220" to-port="0" /> <edge from-layer="5220" from-port="2" to-layer="5221" to-port="1" /> <edge from-layer="5221" from-port="2" to-layer="5222" to-port="1" /> <edge from-layer="5222" from-port="2" to-layer="6128" to-port="0" /> <edge from-layer="5222" from-port="2" to-layer="5223" to-port="0" /> <edge from-layer="5223" from-port="2" to-layer="5224" to-port="0" /> <edge from-layer="5224" from-port="2" to-layer="5226" to-port="0" /> <edge from-layer="5225" from-port="0" to-layer="5226" to-port="1" /> <edge from-layer="5226" from-port="2" to-layer="5248" to-port="1" /> <edge from-layer="5227" from-port="1" to-layer="5229" to-port="0" /> <edge from-layer="5228" from-port="0" to-layer="5229" to-port="2" /> <edge from-layer="5229" from-port="3" to-layer="5243" to-port="0" /> <edge from-layer="5230" from-port="0" to-layer="5231" to-port="0" /> <edge from-layer="5231" from-port="1" to-layer="5234" to-port="0" /> <edge from-layer="5232" from-port="0" to-layer="5233" to-port="0" /> <edge from-layer="5233" from-port="1" to-layer="5234" to-port="1" /> <edge from-layer="5234" from-port="2" to-layer="5236" to-port="0" /> <edge from-layer="5235" from-port="0" to-layer="5236" to-port="1" /> <edge from-layer="5236" from-port="2" to-layer="5237" to-port="0" /> <edge from-layer="5237" from-port="1" to-layer="5238" to-port="1" /> <edge from-layer="5238" from-port="2" to-layer="5240" to-port="0" /> <edge from-layer="5239" from-port="0" to-layer="5240" to-port="1" /> <edge from-layer="5240" from-port="2" to-layer="5242" to-port="0" /> <edge from-layer="5241" from-port="0" to-layer="5242" to-port="1" /> <edge from-layer="5242" from-port="2" to-layer="5243" to-port="1" /> <edge from-layer="5243" from-port="2" to-layer="6127" to-port="0" /> <edge from-layer="5243" from-port="2" to-layer="5244" to-port="0" /> <edge from-layer="5244" from-port="2" to-layer="5245" to-port="0" /> <edge from-layer="5245" from-port="2" to-layer="5247" to-port="0" /> <edge from-layer="5246" from-port="0" to-layer="5247" to-port="1" /> <edge from-layer="5247" from-port="2" to-layer="5248" to-port="2" /> <edge from-layer="5248" from-port="4" to-layer="5250" to-port="0" /> <edge from-layer="5249" from-port="0" to-layer="5250" to-port="1" /> <edge from-layer="5250" from-port="2" to-layer="5251" to-port="0" /> <edge from-layer="5251" from-port="2" to-layer="5260" to-port="0" /> <edge from-layer="5252" from-port="0" to-layer="5253" to-port="0" /> <edge from-layer="5253" from-port="1" to-layer="5256" to-port="0" /> <edge from-layer="5254" from-port="0" to-layer="5255" to-port="0" /> <edge from-layer="5255" from-port="1" to-layer="5256" to-port="1" /> <edge from-layer="5256" from-port="2" to-layer="5258" to-port="0" /> <edge from-layer="5257" from-port="0" to-layer="5258" to-port="1" /> <edge from-layer="5258" from-port="2" to-layer="5259" to-port="0" /> <edge from-layer="5259" from-port="1" to-layer="5260" to-port="1" /> <edge from-layer="5260" from-port="2" to-layer="5261" to-port="1" /> <edge from-layer="5261" from-port="2" to-layer="5265" to-port="0" /> <edge from-layer="5261" from-port="2" to-layer="5272" to-port="0" /> <edge from-layer="5261" from-port="2" to-layer="5303" to-port="0" /> <edge from-layer="5262" from-port="0" to-layer="5273" to-port="0" /> <edge from-layer="5263" from-port="0" to-layer="5271" to-port="0" /> <edge from-layer="5264" from-port="0" to-layer="5265" to-port="1" /> <edge from-layer="5265" from-port="2" to-layer="5267" to-port="0" /> <edge from-layer="5266" from-port="0" to-layer="5267" to-port="1" /> <edge from-layer="5267" from-port="2" to-layer="5269" to-port="0" /> <edge from-layer="5268" from-port="0" to-layer="5269" to-port="1" /> <edge from-layer="5269" from-port="2" to-layer="5270" to-port="0" /> <edge from-layer="5270" from-port="1" to-layer="5271" to-port="1" /> <edge from-layer="5271" from-port="2" to-layer="5272" to-port="1" /> <edge from-layer="5272" from-port="2" to-layer="5273" to-port="1" /> <edge from-layer="5273" from-port="2" to-layer="5292" to-port="0" /> <edge from-layer="5273" from-port="2" to-layer="5282" to-port="0" /> <edge from-layer="5274" from-port="0" to-layer="5275" to-port="0" /> <edge from-layer="5275" from-port="1" to-layer="5278" to-port="0" /> <edge from-layer="5276" from-port="0" to-layer="5277" to-port="0" /> <edge from-layer="5277" from-port="1" to-layer="5278" to-port="1" /> <edge from-layer="5278" from-port="2" to-layer="5280" to-port="0" /> <edge from-layer="5279" from-port="0" to-layer="5280" to-port="1" /> <edge from-layer="5280" from-port="2" to-layer="5281" to-port="0" /> <edge from-layer="5281" from-port="1" to-layer="5282" to-port="1" /> <edge from-layer="5282" from-port="2" to-layer="5283" to-port="0" /> <edge from-layer="5283" from-port="1" to-layer="5293" to-port="0" /> <edge from-layer="5284" from-port="0" to-layer="5285" to-port="0" /> <edge from-layer="5285" from-port="1" to-layer="5288" to-port="0" /> <edge from-layer="5286" from-port="0" to-layer="5287" to-port="0" /> <edge from-layer="5287" from-port="1" to-layer="5288" to-port="1" /> <edge from-layer="5288" from-port="2" to-layer="5290" to-port="0" /> <edge from-layer="5289" from-port="0" to-layer="5290" to-port="1" /> <edge from-layer="5290" from-port="2" to-layer="5291" to-port="0" /> <edge from-layer="5291" from-port="1" to-layer="5292" to-port="1" /> <edge from-layer="5292" from-port="2" to-layer="5293" to-port="1" /> <edge from-layer="5293" from-port="2" to-layer="5302" to-port="0" /> <edge from-layer="5294" from-port="0" to-layer="5295" to-port="0" /> <edge from-layer="5295" from-port="1" to-layer="5298" to-port="0" /> <edge from-layer="5296" from-port="0" to-layer="5297" to-port="0" /> <edge from-layer="5297" from-port="1" to-layer="5298" to-port="1" /> <edge from-layer="5298" from-port="2" to-layer="5300" to-port="0" /> <edge from-layer="5299" from-port="0" to-layer="5300" to-port="1" /> <edge from-layer="5300" from-port="2" to-layer="5301" to-port="0" /> <edge from-layer="5301" from-port="1" to-layer="5302" to-port="1" /> <edge from-layer="5302" from-port="2" to-layer="5303" to-port="1" /> <edge from-layer="5303" from-port="2" to-layer="5412" to-port="0" /> <edge from-layer="5303" from-port="2" to-layer="5307" to-port="0" /> <edge from-layer="5303" from-port="2" to-layer="5314" to-port="0" /> <edge from-layer="5304" from-port="0" to-layer="5315" to-port="0" /> <edge from-layer="5305" from-port="0" to-layer="5313" to-port="0" /> <edge from-layer="5306" from-port="0" to-layer="5307" to-port="1" /> <edge from-layer="5307" from-port="2" to-layer="5309" to-port="0" /> <edge from-layer="5308" from-port="0" to-layer="5309" to-port="1" /> <edge from-layer="5309" from-port="2" to-layer="5311" to-port="0" /> <edge from-layer="5310" from-port="0" to-layer="5311" to-port="1" /> <edge from-layer="5311" from-port="2" to-layer="5312" to-port="0" /> <edge from-layer="5312" from-port="1" to-layer="5313" to-port="1" /> <edge from-layer="5313" from-port="2" to-layer="5314" to-port="1" /> <edge from-layer="5314" from-port="2" to-layer="5315" to-port="1" /> <edge from-layer="5315" from-port="2" to-layer="5389" to-port="0" /> <edge from-layer="5315" from-port="2" to-layer="5354" to-port="0" /> <edge from-layer="5315" from-port="2" to-layer="5324" to-port="0" /> <edge from-layer="5316" from-port="0" to-layer="5317" to-port="0" /> <edge from-layer="5317" from-port="1" to-layer="5320" to-port="0" /> <edge from-layer="5318" from-port="0" to-layer="5319" to-port="0" /> <edge from-layer="5319" from-port="1" to-layer="5320" to-port="1" /> <edge from-layer="5320" from-port="2" to-layer="5322" to-port="0" /> <edge from-layer="5321" from-port="0" to-layer="5322" to-port="1" /> <edge from-layer="5322" from-port="2" to-layer="5323" to-port="0" /> <edge from-layer="5323" from-port="1" to-layer="5324" to-port="1" /> <edge from-layer="5324" from-port="2" to-layer="5326" to-port="0" /> <edge from-layer="5325" from-port="0" to-layer="5326" to-port="1" /> <edge from-layer="5326" from-port="2" to-layer="5328" to-port="0" /> <edge from-layer="5327" from-port="0" to-layer="5328" to-port="1" /> <edge from-layer="5328" from-port="2" to-layer="5339" to-port="0" /> <edge from-layer="5328" from-port="2" to-layer="5329" to-port="0" /> <edge from-layer="5328" from-port="2" to-layer="5333" to-port="0" /> <edge from-layer="5329" from-port="2" to-layer="5342" to-port="0" /> <edge from-layer="5330" from-port="0" to-layer="5333" to-port="1" /> <edge from-layer="5331" from-port="0" to-layer="5333" to-port="2" /> <edge from-layer="5332" from-port="0" to-layer="5333" to-port="3" /> <edge from-layer="5333" from-port="5" to-layer="5335" to-port="0" /> <edge from-layer="5334" from-port="0" to-layer="5335" to-port="1" /> <edge from-layer="5335" from-port="2" to-layer="5340" to-port="0" /> <edge from-layer="5336" from-port="0" to-layer="5339" to-port="1" /> <edge from-layer="5337" from-port="0" to-layer="5339" to-port="2" /> <edge from-layer="5338" from-port="0" to-layer="5339" to-port="3" /> <edge from-layer="5339" from-port="5" to-layer="5340" to-port="1" /> <edge from-layer="5340" from-port="2" to-layer="5341" to-port="0" /> <edge from-layer="5341" from-port="2" to-layer="5342" to-port="1" /> <edge from-layer="5342" from-port="2" to-layer="5399" to-port="0" /> <edge from-layer="5343" from-port="1" to-layer="5345" to-port="0" /> <edge from-layer="5344" from-port="0" to-layer="5345" to-port="2" /> <edge from-layer="5345" from-port="3" to-layer="5373" to-port="0" /> <edge from-layer="5346" from-port="0" to-layer="5347" to-port="0" /> <edge from-layer="5347" from-port="1" to-layer="5350" to-port="0" /> <edge from-layer="5348" from-port="0" to-layer="5349" to-port="0" /> <edge from-layer="5349" from-port="1" to-layer="5350" to-port="1" /> <edge from-layer="5350" from-port="2" to-layer="5352" to-port="0" /> <edge from-layer="5351" from-port="0" to-layer="5352" to-port="1" /> <edge from-layer="5352" from-port="2" to-layer="5353" to-port="0" /> <edge from-layer="5353" from-port="1" to-layer="5354" to-port="1" /> <edge from-layer="5354" from-port="2" to-layer="5356" to-port="0" /> <edge from-layer="5355" from-port="0" to-layer="5356" to-port="1" /> <edge from-layer="5356" from-port="2" to-layer="5358" to-port="0" /> <edge from-layer="5357" from-port="0" to-layer="5358" to-port="1" /> <edge from-layer="5358" from-port="2" to-layer="5359" to-port="0" /> <edge from-layer="5358" from-port="2" to-layer="5363" to-port="0" /> <edge from-layer="5358" from-port="2" to-layer="5369" to-port="0" /> <edge from-layer="5359" from-port="2" to-layer="5372" to-port="0" /> <edge from-layer="5360" from-port="0" to-layer="5363" to-port="1" /> <edge from-layer="5361" from-port="0" to-layer="5363" to-port="2" /> <edge from-layer="5362" from-port="0" to-layer="5363" to-port="3" /> <edge from-layer="5363" from-port="5" to-layer="5365" to-port="0" /> <edge from-layer="5364" from-port="0" to-layer="5365" to-port="1" /> <edge from-layer="5365" from-port="2" to-layer="5370" to-port="0" /> <edge from-layer="5366" from-port="0" to-layer="5369" to-port="1" /> <edge from-layer="5367" from-port="0" to-layer="5369" to-port="2" /> <edge from-layer="5368" from-port="0" to-layer="5369" to-port="3" /> <edge from-layer="5369" from-port="5" to-layer="5370" to-port="1" /> <edge from-layer="5370" from-port="2" to-layer="5371" to-port="0" /> <edge from-layer="5371" from-port="2" to-layer="5372" to-port="1" /> <edge from-layer="5372" from-port="2" to-layer="5373" to-port="1" /> <edge from-layer="5373" from-port="2" to-layer="5374" to-port="0" /> <edge from-layer="5373" from-port="2" to-layer="6126" to-port="0" /> <edge from-layer="5374" from-port="2" to-layer="5375" to-port="0" /> <edge from-layer="5375" from-port="2" to-layer="5377" to-port="0" /> <edge from-layer="5376" from-port="0" to-layer="5377" to-port="1" /> <edge from-layer="5377" from-port="2" to-layer="5399" to-port="1" /> <edge from-layer="5378" from-port="1" to-layer="5380" to-port="0" /> <edge from-layer="5379" from-port="0" to-layer="5380" to-port="2" /> <edge from-layer="5380" from-port="3" to-layer="5394" to-port="0" /> <edge from-layer="5381" from-port="0" to-layer="5382" to-port="0" /> <edge from-layer="5382" from-port="1" to-layer="5385" to-port="0" /> <edge from-layer="5383" from-port="0" to-layer="5384" to-port="0" /> <edge from-layer="5384" from-port="1" to-layer="5385" to-port="1" /> <edge from-layer="5385" from-port="2" to-layer="5387" to-port="0" /> <edge from-layer="5386" from-port="0" to-layer="5387" to-port="1" /> <edge from-layer="5387" from-port="2" to-layer="5388" to-port="0" /> <edge from-layer="5388" from-port="1" to-layer="5389" to-port="1" /> <edge from-layer="5389" from-port="2" to-layer="5391" to-port="0" /> <edge from-layer="5390" from-port="0" to-layer="5391" to-port="1" /> <edge from-layer="5391" from-port="2" to-layer="5393" to-port="0" /> <edge from-layer="5392" from-port="0" to-layer="5393" to-port="1" /> <edge from-layer="5393" from-port="2" to-layer="5394" to-port="1" /> <edge from-layer="5394" from-port="2" to-layer="5395" to-port="0" /> <edge from-layer="5394" from-port="2" to-layer="6125" to-port="0" /> <edge from-layer="5395" from-port="2" to-layer="5396" to-port="0" /> <edge from-layer="5396" from-port="2" to-layer="5398" to-port="0" /> <edge from-layer="5397" from-port="0" to-layer="5398" to-port="1" /> <edge from-layer="5398" from-port="2" to-layer="5399" to-port="2" /> <edge from-layer="5399" from-port="4" to-layer="5401" to-port="0" /> <edge from-layer="5400" from-port="0" to-layer="5401" to-port="1" /> <edge from-layer="5401" from-port="2" to-layer="5402" to-port="0" /> <edge from-layer="5402" from-port="2" to-layer="5411" to-port="0" /> <edge from-layer="5403" from-port="0" to-layer="5404" to-port="0" /> <edge from-layer="5404" from-port="1" to-layer="5407" to-port="0" /> <edge from-layer="5405" from-port="0" to-layer="5406" to-port="0" /> <edge from-layer="5406" from-port="1" to-layer="5407" to-port="1" /> <edge from-layer="5407" from-port="2" to-layer="5409" to-port="0" /> <edge from-layer="5408" from-port="0" to-layer="5409" to-port="1" /> <edge from-layer="5409" from-port="2" to-layer="5410" to-port="0" /> <edge from-layer="5410" from-port="1" to-layer="5411" to-port="1" /> <edge from-layer="5411" from-port="2" to-layer="5412" to-port="1" /> <edge from-layer="5412" from-port="2" to-layer="5423" to-port="0" /> <edge from-layer="5412" from-port="2" to-layer="5454" to-port="0" /> <edge from-layer="5412" from-port="2" to-layer="5416" to-port="0" /> <edge from-layer="5413" from-port="0" to-layer="5424" to-port="0" /> <edge from-layer="5414" from-port="0" to-layer="5422" to-port="0" /> <edge from-layer="5415" from-port="0" to-layer="5416" to-port="1" /> <edge from-layer="5416" from-port="2" to-layer="5418" to-port="0" /> <edge from-layer="5417" from-port="0" to-layer="5418" to-port="1" /> <edge from-layer="5418" from-port="2" to-layer="5420" to-port="0" /> <edge from-layer="5419" from-port="0" to-layer="5420" to-port="1" /> <edge from-layer="5420" from-port="2" to-layer="5421" to-port="0" /> <edge from-layer="5421" from-port="1" to-layer="5422" to-port="1" /> <edge from-layer="5422" from-port="2" to-layer="5423" to-port="1" /> <edge from-layer="5423" from-port="2" to-layer="5424" to-port="1" /> <edge from-layer="5424" from-port="2" to-layer="5433" to-port="0" /> <edge from-layer="5424" from-port="2" to-layer="5443" to-port="0" /> <edge from-layer="5425" from-port="0" to-layer="5426" to-port="0" /> <edge from-layer="5426" from-port="1" to-layer="5429" to-port="0" /> <edge from-layer="5427" from-port="0" to-layer="5428" to-port="0" /> <edge from-layer="5428" from-port="1" to-layer="5429" to-port="1" /> <edge from-layer="5429" from-port="2" to-layer="5431" to-port="0" /> <edge from-layer="5430" from-port="0" to-layer="5431" to-port="1" /> <edge from-layer="5431" from-port="2" to-layer="5432" to-port="0" /> <edge from-layer="5432" from-port="1" to-layer="5433" to-port="1" /> <edge from-layer="5433" from-port="2" to-layer="5434" to-port="0" /> <edge from-layer="5434" from-port="1" to-layer="5444" to-port="0" /> <edge from-layer="5435" from-port="0" to-layer="5436" to-port="0" /> <edge from-layer="5436" from-port="1" to-layer="5439" to-port="0" /> <edge from-layer="5437" from-port="0" to-layer="5438" to-port="0" /> <edge from-layer="5438" from-port="1" to-layer="5439" to-port="1" /> <edge from-layer="5439" from-port="2" to-layer="5441" to-port="0" /> <edge from-layer="5440" from-port="0" to-layer="5441" to-port="1" /> <edge from-layer="5441" from-port="2" to-layer="5442" to-port="0" /> <edge from-layer="5442" from-port="1" to-layer="5443" to-port="1" /> <edge from-layer="5443" from-port="2" to-layer="5444" to-port="1" /> <edge from-layer="5444" from-port="2" to-layer="5453" to-port="0" /> <edge from-layer="5445" from-port="0" to-layer="5446" to-port="0" /> <edge from-layer="5446" from-port="1" to-layer="5449" to-port="0" /> <edge from-layer="5447" from-port="0" to-layer="5448" to-port="0" /> <edge from-layer="5448" from-port="1" to-layer="5449" to-port="1" /> <edge from-layer="5449" from-port="2" to-layer="5451" to-port="0" /> <edge from-layer="5450" from-port="0" to-layer="5451" to-port="1" /> <edge from-layer="5451" from-port="2" to-layer="5452" to-port="0" /> <edge from-layer="5452" from-port="1" to-layer="5453" to-port="1" /> <edge from-layer="5453" from-port="2" to-layer="5454" to-port="1" /> <edge from-layer="5454" from-port="2" to-layer="5563" to-port="0" /> <edge from-layer="5454" from-port="2" to-layer="5458" to-port="0" /> <edge from-layer="5454" from-port="2" to-layer="5465" to-port="0" /> <edge from-layer="5455" from-port="0" to-layer="5466" to-port="0" /> <edge from-layer="5456" from-port="0" to-layer="5464" to-port="0" /> <edge from-layer="5457" from-port="0" to-layer="5458" to-port="1" /> <edge from-layer="5458" from-port="2" to-layer="5460" to-port="0" /> <edge from-layer="5459" from-port="0" to-layer="5460" to-port="1" /> <edge from-layer="5460" from-port="2" to-layer="5462" to-port="0" /> <edge from-layer="5461" from-port="0" to-layer="5462" to-port="1" /> <edge from-layer="5462" from-port="2" to-layer="5463" to-port="0" /> <edge from-layer="5463" from-port="1" to-layer="5464" to-port="1" /> <edge from-layer="5464" from-port="2" to-layer="5465" to-port="1" /> <edge from-layer="5465" from-port="2" to-layer="5466" to-port="1" /> <edge from-layer="5466" from-port="2" to-layer="5475" to-port="0" /> <edge from-layer="5466" from-port="2" to-layer="5505" to-port="0" /> <edge from-layer="5466" from-port="2" to-layer="5540" to-port="0" /> <edge from-layer="5467" from-port="0" to-layer="5468" to-port="0" /> <edge from-layer="5468" from-port="1" to-layer="5471" to-port="0" /> <edge from-layer="5469" from-port="0" to-layer="5470" to-port="0" /> <edge from-layer="5470" from-port="1" to-layer="5471" to-port="1" /> <edge from-layer="5471" from-port="2" to-layer="5473" to-port="0" /> <edge from-layer="5472" from-port="0" to-layer="5473" to-port="1" /> <edge from-layer="5473" from-port="2" to-layer="5474" to-port="0" /> <edge from-layer="5474" from-port="1" to-layer="5475" to-port="1" /> <edge from-layer="5475" from-port="2" to-layer="5477" to-port="0" /> <edge from-layer="5476" from-port="0" to-layer="5477" to-port="1" /> <edge from-layer="5477" from-port="2" to-layer="5479" to-port="0" /> <edge from-layer="5478" from-port="0" to-layer="5479" to-port="1" /> <edge from-layer="5479" from-port="2" to-layer="5484" to-port="0" /> <edge from-layer="5479" from-port="2" to-layer="5490" to-port="0" /> <edge from-layer="5479" from-port="2" to-layer="5480" to-port="0" /> <edge from-layer="5480" from-port="2" to-layer="5493" to-port="0" /> <edge from-layer="5481" from-port="0" to-layer="5484" to-port="1" /> <edge from-layer="5482" from-port="0" to-layer="5484" to-port="2" /> <edge from-layer="5483" from-port="0" to-layer="5484" to-port="3" /> <edge from-layer="5484" from-port="5" to-layer="5486" to-port="0" /> <edge from-layer="5485" from-port="0" to-layer="5486" to-port="1" /> <edge from-layer="5486" from-port="2" to-layer="5491" to-port="0" /> <edge from-layer="5487" from-port="0" to-layer="5490" to-port="1" /> <edge from-layer="5488" from-port="0" to-layer="5490" to-port="2" /> <edge from-layer="5489" from-port="0" to-layer="5490" to-port="3" /> <edge from-layer="5490" from-port="5" to-layer="5491" to-port="1" /> <edge from-layer="5491" from-port="2" to-layer="5492" to-port="0" /> <edge from-layer="5492" from-port="2" to-layer="5493" to-port="1" /> <edge from-layer="5493" from-port="2" to-layer="5550" to-port="0" /> <edge from-layer="5494" from-port="1" to-layer="5496" to-port="0" /> <edge from-layer="5495" from-port="0" to-layer="5496" to-port="2" /> <edge from-layer="5496" from-port="3" to-layer="5524" to-port="0" /> <edge from-layer="5497" from-port="0" to-layer="5498" to-port="0" /> <edge from-layer="5498" from-port="1" to-layer="5501" to-port="0" /> <edge from-layer="5499" from-port="0" to-layer="5500" to-port="0" /> <edge from-layer="5500" from-port="1" to-layer="5501" to-port="1" /> <edge from-layer="5501" from-port="2" to-layer="5503" to-port="0" /> <edge from-layer="5502" from-port="0" to-layer="5503" to-port="1" /> <edge from-layer="5503" from-port="2" to-layer="5504" to-port="0" /> <edge from-layer="5504" from-port="1" to-layer="5505" to-port="1" /> <edge from-layer="5505" from-port="2" to-layer="5507" to-port="0" /> <edge from-layer="5506" from-port="0" to-layer="5507" to-port="1" /> <edge from-layer="5507" from-port="2" to-layer="5509" to-port="0" /> <edge from-layer="5508" from-port="0" to-layer="5509" to-port="1" /> <edge from-layer="5509" from-port="2" to-layer="5514" to-port="0" /> <edge from-layer="5509" from-port="2" to-layer="5520" to-port="0" /> <edge from-layer="5509" from-port="2" to-layer="5510" to-port="0" /> <edge from-layer="5510" from-port="2" to-layer="5523" to-port="0" /> <edge from-layer="5511" from-port="0" to-layer="5514" to-port="1" /> <edge from-layer="5512" from-port="0" to-layer="5514" to-port="2" /> <edge from-layer="5513" from-port="0" to-layer="5514" to-port="3" /> <edge from-layer="5514" from-port="5" to-layer="5516" to-port="0" /> <edge from-layer="5515" from-port="0" to-layer="5516" to-port="1" /> <edge from-layer="5516" from-port="2" to-layer="5521" to-port="0" /> <edge from-layer="5517" from-port="0" to-layer="5520" to-port="1" /> <edge from-layer="5518" from-port="0" to-layer="5520" to-port="2" /> <edge from-layer="5519" from-port="0" to-layer="5520" to-port="3" /> <edge from-layer="5520" from-port="5" to-layer="5521" to-port="1" /> <edge from-layer="5521" from-port="2" to-layer="5522" to-port="0" /> <edge from-layer="5522" from-port="2" to-layer="5523" to-port="1" /> <edge from-layer="5523" from-port="2" to-layer="5524" to-port="1" /> <edge from-layer="5524" from-port="2" to-layer="5525" to-port="0" /> <edge from-layer="5524" from-port="2" to-layer="6124" to-port="0" /> <edge from-layer="5525" from-port="2" to-layer="5526" to-port="0" /> <edge from-layer="5526" from-port="2" to-layer="5528" to-port="0" /> <edge from-layer="5527" from-port="0" to-layer="5528" to-port="1" /> <edge from-layer="5528" from-port="2" to-layer="5550" to-port="1" /> <edge from-layer="5529" from-port="1" to-layer="5531" to-port="0" /> <edge from-layer="5530" from-port="0" to-layer="5531" to-port="2" /> <edge from-layer="5531" from-port="3" to-layer="5545" to-port="0" /> <edge from-layer="5532" from-port="0" to-layer="5533" to-port="0" /> <edge from-layer="5533" from-port="1" to-layer="5536" to-port="0" /> <edge from-layer="5534" from-port="0" to-layer="5535" to-port="0" /> <edge from-layer="5535" from-port="1" to-layer="5536" to-port="1" /> <edge from-layer="5536" from-port="2" to-layer="5538" to-port="0" /> <edge from-layer="5537" from-port="0" to-layer="5538" to-port="1" /> <edge from-layer="5538" from-port="2" to-layer="5539" to-port="0" /> <edge from-layer="5539" from-port="1" to-layer="5540" to-port="1" /> <edge from-layer="5540" from-port="2" to-layer="5542" to-port="0" /> <edge from-layer="5541" from-port="0" to-layer="5542" to-port="1" /> <edge from-layer="5542" from-port="2" to-layer="5544" to-port="0" /> <edge from-layer="5543" from-port="0" to-layer="5544" to-port="1" /> <edge from-layer="5544" from-port="2" to-layer="5545" to-port="1" /> <edge from-layer="5545" from-port="2" to-layer="5546" to-port="0" /> <edge from-layer="5545" from-port="2" to-layer="6123" to-port="0" /> <edge from-layer="5546" from-port="2" to-layer="5547" to-port="0" /> <edge from-layer="5547" from-port="2" to-layer="5549" to-port="0" /> <edge from-layer="5548" from-port="0" to-layer="5549" to-port="1" /> <edge from-layer="5549" from-port="2" to-layer="5550" to-port="2" /> <edge from-layer="5550" from-port="4" to-layer="5552" to-port="0" /> <edge from-layer="5551" from-port="0" to-layer="5552" to-port="1" /> <edge from-layer="5552" from-port="2" to-layer="5553" to-port="0" /> <edge from-layer="5553" from-port="2" to-layer="5562" to-port="0" /> <edge from-layer="5554" from-port="0" to-layer="5555" to-port="0" /> <edge from-layer="5555" from-port="1" to-layer="5558" to-port="0" /> <edge from-layer="5556" from-port="0" to-layer="5557" to-port="0" /> <edge from-layer="5557" from-port="1" to-layer="5558" to-port="1" /> <edge from-layer="5558" from-port="2" to-layer="5560" to-port="0" /> <edge from-layer="5559" from-port="0" to-layer="5560" to-port="1" /> <edge from-layer="5560" from-port="2" to-layer="5561" to-port="0" /> <edge from-layer="5561" from-port="1" to-layer="5562" to-port="1" /> <edge from-layer="5562" from-port="2" to-layer="5563" to-port="1" /> <edge from-layer="5563" from-port="2" to-layer="5605" to-port="0" /> <edge from-layer="5563" from-port="2" to-layer="5567" to-port="0" /> <edge from-layer="5563" from-port="2" to-layer="5574" to-port="0" /> <edge from-layer="5564" from-port="0" to-layer="5575" to-port="0" /> <edge from-layer="5565" from-port="0" to-layer="5573" to-port="0" /> <edge from-layer="5566" from-port="0" to-layer="5567" to-port="1" /> <edge from-layer="5567" from-port="2" to-layer="5569" to-port="0" /> <edge from-layer="5568" from-port="0" to-layer="5569" to-port="1" /> <edge from-layer="5569" from-port="2" to-layer="5571" to-port="0" /> <edge from-layer="5570" from-port="0" to-layer="5571" to-port="1" /> <edge from-layer="5571" from-port="2" to-layer="5572" to-port="0" /> <edge from-layer="5572" from-port="1" to-layer="5573" to-port="1" /> <edge from-layer="5573" from-port="2" to-layer="5574" to-port="1" /> <edge from-layer="5574" from-port="2" to-layer="5575" to-port="1" /> <edge from-layer="5575" from-port="2" to-layer="5594" to-port="0" /> <edge from-layer="5575" from-port="2" to-layer="5584" to-port="0" /> <edge from-layer="5576" from-port="0" to-layer="5577" to-port="0" /> <edge from-layer="5577" from-port="1" to-layer="5580" to-port="0" /> <edge from-layer="5578" from-port="0" to-layer="5579" to-port="0" /> <edge from-layer="5579" from-port="1" to-layer="5580" to-port="1" /> <edge from-layer="5580" from-port="2" to-layer="5582" to-port="0" /> <edge from-layer="5581" from-port="0" to-layer="5582" to-port="1" /> <edge from-layer="5582" from-port="2" to-layer="5583" to-port="0" /> <edge from-layer="5583" from-port="1" to-layer="5584" to-port="1" /> <edge from-layer="5584" from-port="2" to-layer="5585" to-port="0" /> <edge from-layer="5585" from-port="1" to-layer="5595" to-port="0" /> <edge from-layer="5586" from-port="0" to-layer="5587" to-port="0" /> <edge from-layer="5587" from-port="1" to-layer="5590" to-port="0" /> <edge from-layer="5588" from-port="0" to-layer="5589" to-port="0" /> <edge from-layer="5589" from-port="1" to-layer="5590" to-port="1" /> <edge from-layer="5590" from-port="2" to-layer="5592" to-port="0" /> <edge from-layer="5591" from-port="0" to-layer="5592" to-port="1" /> <edge from-layer="5592" from-port="2" to-layer="5593" to-port="0" /> <edge from-layer="5593" from-port="1" to-layer="5594" to-port="1" /> <edge from-layer="5594" from-port="2" to-layer="5595" to-port="1" /> <edge from-layer="5595" from-port="2" to-layer="5604" to-port="0" /> <edge from-layer="5596" from-port="0" to-layer="5597" to-port="0" /> <edge from-layer="5597" from-port="1" to-layer="5600" to-port="0" /> <edge from-layer="5598" from-port="0" to-layer="5599" to-port="0" /> <edge from-layer="5599" from-port="1" to-layer="5600" to-port="1" /> <edge from-layer="5600" from-port="2" to-layer="5602" to-port="0" /> <edge from-layer="5601" from-port="0" to-layer="5602" to-port="1" /> <edge from-layer="5602" from-port="2" to-layer="5603" to-port="0" /> <edge from-layer="5603" from-port="1" to-layer="5604" to-port="1" /> <edge from-layer="5604" from-port="2" to-layer="5605" to-port="1" /> <edge from-layer="5605" from-port="2" to-layer="5616" to-port="0" /> <edge from-layer="5605" from-port="2" to-layer="5714" to-port="0" /> <edge from-layer="5605" from-port="2" to-layer="5609" to-port="0" /> <edge from-layer="5606" from-port="0" to-layer="5617" to-port="0" /> <edge from-layer="5607" from-port="0" to-layer="5615" to-port="0" /> <edge from-layer="5608" from-port="0" to-layer="5609" to-port="1" /> <edge from-layer="5609" from-port="2" to-layer="5611" to-port="0" /> <edge from-layer="5610" from-port="0" to-layer="5611" to-port="1" /> <edge from-layer="5611" from-port="2" to-layer="5613" to-port="0" /> <edge from-layer="5612" from-port="0" to-layer="5613" to-port="1" /> <edge from-layer="5613" from-port="2" to-layer="5614" to-port="0" /> <edge from-layer="5614" from-port="1" to-layer="5615" to-port="1" /> <edge from-layer="5615" from-port="2" to-layer="5616" to-port="1" /> <edge from-layer="5616" from-port="2" to-layer="5617" to-port="1" /> <edge from-layer="5617" from-port="2" to-layer="5691" to-port="0" /> <edge from-layer="5617" from-port="2" to-layer="5656" to-port="0" /> <edge from-layer="5617" from-port="2" to-layer="5626" to-port="0" /> <edge from-layer="5618" from-port="0" to-layer="5619" to-port="0" /> <edge from-layer="5619" from-port="1" to-layer="5622" to-port="0" /> <edge from-layer="5620" from-port="0" to-layer="5621" to-port="0" /> <edge from-layer="5621" from-port="1" to-layer="5622" to-port="1" /> <edge from-layer="5622" from-port="2" to-layer="5624" to-port="0" /> <edge from-layer="5623" from-port="0" to-layer="5624" to-port="1" /> <edge from-layer="5624" from-port="2" to-layer="5625" to-port="0" /> <edge from-layer="5625" from-port="1" to-layer="5626" to-port="1" /> <edge from-layer="5626" from-port="2" to-layer="5628" to-port="0" /> <edge from-layer="5627" from-port="0" to-layer="5628" to-port="1" /> <edge from-layer="5628" from-port="2" to-layer="5630" to-port="0" /> <edge from-layer="5629" from-port="0" to-layer="5630" to-port="1" /> <edge from-layer="5630" from-port="2" to-layer="5631" to-port="0" /> <edge from-layer="5630" from-port="2" to-layer="5635" to-port="0" /> <edge from-layer="5630" from-port="2" to-layer="5641" to-port="0" /> <edge from-layer="5631" from-port="2" to-layer="5644" to-port="0" /> <edge from-layer="5632" from-port="0" to-layer="5635" to-port="1" /> <edge from-layer="5633" from-port="0" to-layer="5635" to-port="2" /> <edge from-layer="5634" from-port="0" to-layer="5635" to-port="3" /> <edge from-layer="5635" from-port="5" to-layer="5637" to-port="0" /> <edge from-layer="5636" from-port="0" to-layer="5637" to-port="1" /> <edge from-layer="5637" from-port="2" to-layer="5642" to-port="0" /> <edge from-layer="5638" from-port="0" to-layer="5641" to-port="1" /> <edge from-layer="5639" from-port="0" to-layer="5641" to-port="2" /> <edge from-layer="5640" from-port="0" to-layer="5641" to-port="3" /> <edge from-layer="5641" from-port="5" to-layer="5642" to-port="1" /> <edge from-layer="5642" from-port="2" to-layer="5643" to-port="0" /> <edge from-layer="5643" from-port="2" to-layer="5644" to-port="1" /> <edge from-layer="5644" from-port="2" to-layer="5701" to-port="0" /> <edge from-layer="5645" from-port="1" to-layer="5647" to-port="0" /> <edge from-layer="5646" from-port="0" to-layer="5647" to-port="2" /> <edge from-layer="5647" from-port="3" to-layer="5675" to-port="0" /> <edge from-layer="5648" from-port="0" to-layer="5649" to-port="0" /> <edge from-layer="5649" from-port="1" to-layer="5652" to-port="0" /> <edge from-layer="5650" from-port="0" to-layer="5651" to-port="0" /> <edge from-layer="5651" from-port="1" to-layer="5652" to-port="1" /> <edge from-layer="5652" from-port="2" to-layer="5654" to-port="0" /> <edge from-layer="5653" from-port="0" to-layer="5654" to-port="1" /> <edge from-layer="5654" from-port="2" to-layer="5655" to-port="0" /> <edge from-layer="5655" from-port="1" to-layer="5656" to-port="1" /> <edge from-layer="5656" from-port="2" to-layer="5658" to-port="0" /> <edge from-layer="5657" from-port="0" to-layer="5658" to-port="1" /> <edge from-layer="5658" from-port="2" to-layer="5660" to-port="0" /> <edge from-layer="5659" from-port="0" to-layer="5660" to-port="1" /> <edge from-layer="5660" from-port="2" to-layer="5661" to-port="0" /> <edge from-layer="5660" from-port="2" to-layer="5665" to-port="0" /> <edge from-layer="5660" from-port="2" to-layer="5671" to-port="0" /> <edge from-layer="5661" from-port="2" to-layer="5674" to-port="0" /> <edge from-layer="5662" from-port="0" to-layer="5665" to-port="1" /> <edge from-layer="5663" from-port="0" to-layer="5665" to-port="2" /> <edge from-layer="5664" from-port="0" to-layer="5665" to-port="3" /> <edge from-layer="5665" from-port="5" to-layer="5667" to-port="0" /> <edge from-layer="5666" from-port="0" to-layer="5667" to-port="1" /> <edge from-layer="5667" from-port="2" to-layer="5672" to-port="0" /> <edge from-layer="5668" from-port="0" to-layer="5671" to-port="1" /> <edge from-layer="5669" from-port="0" to-layer="5671" to-port="2" /> <edge from-layer="5670" from-port="0" to-layer="5671" to-port="3" /> <edge from-layer="5671" from-port="5" to-layer="5672" to-port="1" /> <edge from-layer="5672" from-port="2" to-layer="5673" to-port="0" /> <edge from-layer="5673" from-port="2" to-layer="5674" to-port="1" /> <edge from-layer="5674" from-port="2" to-layer="5675" to-port="1" /> <edge from-layer="5675" from-port="2" to-layer="5676" to-port="0" /> <edge from-layer="5675" from-port="2" to-layer="6122" to-port="0" /> <edge from-layer="5676" from-port="2" to-layer="5677" to-port="0" /> <edge from-layer="5677" from-port="2" to-layer="5679" to-port="0" /> <edge from-layer="5678" from-port="0" to-layer="5679" to-port="1" /> <edge from-layer="5679" from-port="2" to-layer="5701" to-port="1" /> <edge from-layer="5680" from-port="1" to-layer="5682" to-port="0" /> <edge from-layer="5681" from-port="0" to-layer="5682" to-port="2" /> <edge from-layer="5682" from-port="3" to-layer="5696" to-port="0" /> <edge from-layer="5683" from-port="0" to-layer="5684" to-port="0" /> <edge from-layer="5684" from-port="1" to-layer="5687" to-port="0" /> <edge from-layer="5685" from-port="0" to-layer="5686" to-port="0" /> <edge from-layer="5686" from-port="1" to-layer="5687" to-port="1" /> <edge from-layer="5687" from-port="2" to-layer="5689" to-port="0" /> <edge from-layer="5688" from-port="0" to-layer="5689" to-port="1" /> <edge from-layer="5689" from-port="2" to-layer="5690" to-port="0" /> <edge from-layer="5690" from-port="1" to-layer="5691" to-port="1" /> <edge from-layer="5691" from-port="2" to-layer="5693" to-port="0" /> <edge from-layer="5692" from-port="0" to-layer="5693" to-port="1" /> <edge from-layer="5693" from-port="2" to-layer="5695" to-port="0" /> <edge from-layer="5694" from-port="0" to-layer="5695" to-port="1" /> <edge from-layer="5695" from-port="2" to-layer="5696" to-port="1" /> <edge from-layer="5696" from-port="2" to-layer="6121" to-port="0" /> <edge from-layer="5696" from-port="2" to-layer="5697" to-port="0" /> <edge from-layer="5697" from-port="2" to-layer="5698" to-port="0" /> <edge from-layer="5698" from-port="2" to-layer="5700" to-port="0" /> <edge from-layer="5699" from-port="0" to-layer="5700" to-port="1" /> <edge from-layer="5700" from-port="2" to-layer="5701" to-port="2" /> <edge from-layer="5701" from-port="4" to-layer="5703" to-port="0" /> <edge from-layer="5702" from-port="0" to-layer="5703" to-port="1" /> <edge from-layer="5703" from-port="2" to-layer="5704" to-port="0" /> <edge from-layer="5704" from-port="2" to-layer="5713" to-port="0" /> <edge from-layer="5705" from-port="0" to-layer="5706" to-port="0" /> <edge from-layer="5706" from-port="1" to-layer="5709" to-port="0" /> <edge from-layer="5707" from-port="0" to-layer="5708" to-port="0" /> <edge from-layer="5708" from-port="1" to-layer="5709" to-port="1" /> <edge from-layer="5709" from-port="2" to-layer="5711" to-port="0" /> <edge from-layer="5710" from-port="0" to-layer="5711" to-port="1" /> <edge from-layer="5711" from-port="2" to-layer="5712" to-port="0" /> <edge from-layer="5712" from-port="1" to-layer="5713" to-port="1" /> <edge from-layer="5713" from-port="2" to-layer="5714" to-port="1" /> <edge from-layer="5714" from-port="2" to-layer="5756" to-port="0" /> <edge from-layer="5714" from-port="2" to-layer="5725" to-port="0" /> <edge from-layer="5714" from-port="2" to-layer="5718" to-port="0" /> <edge from-layer="5715" from-port="0" to-layer="5726" to-port="0" /> <edge from-layer="5716" from-port="0" to-layer="5724" to-port="0" /> <edge from-layer="5717" from-port="0" to-layer="5718" to-port="1" /> <edge from-layer="5718" from-port="2" to-layer="5720" to-port="0" /> <edge from-layer="5719" from-port="0" to-layer="5720" to-port="1" /> <edge from-layer="5720" from-port="2" to-layer="5722" to-port="0" /> <edge from-layer="5721" from-port="0" to-layer="5722" to-port="1" /> <edge from-layer="5722" from-port="2" to-layer="5723" to-port="0" /> <edge from-layer="5723" from-port="1" to-layer="5724" to-port="1" /> <edge from-layer="5724" from-port="2" to-layer="5725" to-port="1" /> <edge from-layer="5725" from-port="2" to-layer="5726" to-port="1" /> <edge from-layer="5726" from-port="2" to-layer="5745" to-port="0" /> <edge from-layer="5726" from-port="2" to-layer="5735" to-port="0" /> <edge from-layer="5727" from-port="0" to-layer="5728" to-port="0" /> <edge from-layer="5728" from-port="1" to-layer="5731" to-port="0" /> <edge from-layer="5729" from-port="0" to-layer="5730" to-port="0" /> <edge from-layer="5730" from-port="1" to-layer="5731" to-port="1" /> <edge from-layer="5731" from-port="2" to-layer="5733" to-port="0" /> <edge from-layer="5732" from-port="0" to-layer="5733" to-port="1" /> <edge from-layer="5733" from-port="2" to-layer="5734" to-port="0" /> <edge from-layer="5734" from-port="1" to-layer="5735" to-port="1" /> <edge from-layer="5735" from-port="2" to-layer="5736" to-port="0" /> <edge from-layer="5736" from-port="1" to-layer="5746" to-port="0" /> <edge from-layer="5737" from-port="0" to-layer="5738" to-port="0" /> <edge from-layer="5738" from-port="1" to-layer="5741" to-port="0" /> <edge from-layer="5739" from-port="0" to-layer="5740" to-port="0" /> <edge from-layer="5740" from-port="1" to-layer="5741" to-port="1" /> <edge from-layer="5741" from-port="2" to-layer="5743" to-port="0" /> <edge from-layer="5742" from-port="0" to-layer="5743" to-port="1" /> <edge from-layer="5743" from-port="2" to-layer="5744" to-port="0" /> <edge from-layer="5744" from-port="1" to-layer="5745" to-port="1" /> <edge from-layer="5745" from-port="2" to-layer="5746" to-port="1" /> <edge from-layer="5746" from-port="2" to-layer="5755" to-port="0" /> <edge from-layer="5747" from-port="0" to-layer="5748" to-port="0" /> <edge from-layer="5748" from-port="1" to-layer="5751" to-port="0" /> <edge from-layer="5749" from-port="0" to-layer="5750" to-port="0" /> <edge from-layer="5750" from-port="1" to-layer="5751" to-port="1" /> <edge from-layer="5751" from-port="2" to-layer="5753" to-port="0" /> <edge from-layer="5752" from-port="0" to-layer="5753" to-port="1" /> <edge from-layer="5753" from-port="2" to-layer="5754" to-port="0" /> <edge from-layer="5754" from-port="1" to-layer="5755" to-port="1" /> <edge from-layer="5755" from-port="2" to-layer="5756" to-port="1" /> <edge from-layer="5756" from-port="2" to-layer="5767" to-port="0" /> <edge from-layer="5756" from-port="2" to-layer="5865" to-port="0" /> <edge from-layer="5756" from-port="2" to-layer="5760" to-port="0" /> <edge from-layer="5757" from-port="0" to-layer="5768" to-port="0" /> <edge from-layer="5758" from-port="0" to-layer="5766" to-port="0" /> <edge from-layer="5759" from-port="0" to-layer="5760" to-port="1" /> <edge from-layer="5760" from-port="2" to-layer="5762" to-port="0" /> <edge from-layer="5761" from-port="0" to-layer="5762" to-port="1" /> <edge from-layer="5762" from-port="2" to-layer="5764" to-port="0" /> <edge from-layer="5763" from-port="0" to-layer="5764" to-port="1" /> <edge from-layer="5764" from-port="2" to-layer="5765" to-port="0" /> <edge from-layer="5765" from-port="1" to-layer="5766" to-port="1" /> <edge from-layer="5766" from-port="2" to-layer="5767" to-port="1" /> <edge from-layer="5767" from-port="2" to-layer="5768" to-port="1" /> <edge from-layer="5768" from-port="2" to-layer="5807" to-port="0" /> <edge from-layer="5768" from-port="2" to-layer="5842" to-port="0" /> <edge from-layer="5768" from-port="2" to-layer="5777" to-port="0" /> <edge from-layer="5769" from-port="0" to-layer="5770" to-port="0" /> <edge from-layer="5770" from-port="1" to-layer="5773" to-port="0" /> <edge from-layer="5771" from-port="0" to-layer="5772" to-port="0" /> <edge from-layer="5772" from-port="1" to-layer="5773" to-port="1" /> <edge from-layer="5773" from-port="2" to-layer="5775" to-port="0" /> <edge from-layer="5774" from-port="0" to-layer="5775" to-port="1" /> <edge from-layer="5775" from-port="2" to-layer="5776" to-port="0" /> <edge from-layer="5776" from-port="1" to-layer="5777" to-port="1" /> <edge from-layer="5777" from-port="2" to-layer="5779" to-port="0" /> <edge from-layer="5778" from-port="0" to-layer="5779" to-port="1" /> <edge from-layer="5779" from-port="2" to-layer="5781" to-port="0" /> <edge from-layer="5780" from-port="0" to-layer="5781" to-port="1" /> <edge from-layer="5781" from-port="2" to-layer="5782" to-port="0" /> <edge from-layer="5781" from-port="2" to-layer="5786" to-port="0" /> <edge from-layer="5781" from-port="2" to-layer="5792" to-port="0" /> <edge from-layer="5782" from-port="2" to-layer="5795" to-port="0" /> <edge from-layer="5783" from-port="0" to-layer="5786" to-port="1" /> <edge from-layer="5784" from-port="0" to-layer="5786" to-port="2" /> <edge from-layer="5785" from-port="0" to-layer="5786" to-port="3" /> <edge from-layer="5786" from-port="5" to-layer="5788" to-port="0" /> <edge from-layer="5787" from-port="0" to-layer="5788" to-port="1" /> <edge from-layer="5788" from-port="2" to-layer="5793" to-port="0" /> <edge from-layer="5789" from-port="0" to-layer="5792" to-port="1" /> <edge from-layer="5790" from-port="0" to-layer="5792" to-port="2" /> <edge from-layer="5791" from-port="0" to-layer="5792" to-port="3" /> <edge from-layer="5792" from-port="5" to-layer="5793" to-port="1" /> <edge from-layer="5793" from-port="2" to-layer="5794" to-port="0" /> <edge from-layer="5794" from-port="2" to-layer="5795" to-port="1" /> <edge from-layer="5795" from-port="2" to-layer="5852" to-port="0" /> <edge from-layer="5796" from-port="1" to-layer="5798" to-port="0" /> <edge from-layer="5797" from-port="0" to-layer="5798" to-port="2" /> <edge from-layer="5798" from-port="3" to-layer="5826" to-port="0" /> <edge from-layer="5799" from-port="0" to-layer="5800" to-port="0" /> <edge from-layer="5800" from-port="1" to-layer="5803" to-port="0" /> <edge from-layer="5801" from-port="0" to-layer="5802" to-port="0" /> <edge from-layer="5802" from-port="1" to-layer="5803" to-port="1" /> <edge from-layer="5803" from-port="2" to-layer="5805" to-port="0" /> <edge from-layer="5804" from-port="0" to-layer="5805" to-port="1" /> <edge from-layer="5805" from-port="2" to-layer="5806" to-port="0" /> <edge from-layer="5806" from-port="1" to-layer="5807" to-port="1" /> <edge from-layer="5807" from-port="2" to-layer="5809" to-port="0" /> <edge from-layer="5808" from-port="0" to-layer="5809" to-port="1" /> <edge from-layer="5809" from-port="2" to-layer="5811" to-port="0" /> <edge from-layer="5810" from-port="0" to-layer="5811" to-port="1" /> <edge from-layer="5811" from-port="2" to-layer="5812" to-port="0" /> <edge from-layer="5811" from-port="2" to-layer="5816" to-port="0" /> <edge from-layer="5811" from-port="2" to-layer="5822" to-port="0" /> <edge from-layer="5812" from-port="2" to-layer="5825" to-port="0" /> <edge from-layer="5813" from-port="0" to-layer="5816" to-port="1" /> <edge from-layer="5814" from-port="0" to-layer="5816" to-port="2" /> <edge from-layer="5815" from-port="0" to-layer="5816" to-port="3" /> <edge from-layer="5816" from-port="5" to-layer="5818" to-port="0" /> <edge from-layer="5817" from-port="0" to-layer="5818" to-port="1" /> <edge from-layer="5818" from-port="2" to-layer="5823" to-port="0" /> <edge from-layer="5819" from-port="0" to-layer="5822" to-port="1" /> <edge from-layer="5820" from-port="0" to-layer="5822" to-port="2" /> <edge from-layer="5821" from-port="0" to-layer="5822" to-port="3" /> <edge from-layer="5822" from-port="5" to-layer="5823" to-port="1" /> <edge from-layer="5823" from-port="2" to-layer="5824" to-port="0" /> <edge from-layer="5824" from-port="2" to-layer="5825" to-port="1" /> <edge from-layer="5825" from-port="2" to-layer="5826" to-port="1" /> <edge from-layer="5826" from-port="2" to-layer="6120" to-port="0" /> <edge from-layer="5826" from-port="2" to-layer="5827" to-port="0" /> <edge from-layer="5827" from-port="2" to-layer="5828" to-port="0" /> <edge from-layer="5828" from-port="2" to-layer="5830" to-port="0" /> <edge from-layer="5829" from-port="0" to-layer="5830" to-port="1" /> <edge from-layer="5830" from-port="2" to-layer="5852" to-port="1" /> <edge from-layer="5831" from-port="1" to-layer="5833" to-port="0" /> <edge from-layer="5832" from-port="0" to-layer="5833" to-port="2" /> <edge from-layer="5833" from-port="3" to-layer="5847" to-port="0" /> <edge from-layer="5834" from-port="0" to-layer="5835" to-port="0" /> <edge from-layer="5835" from-port="1" to-layer="5838" to-port="0" /> <edge from-layer="5836" from-port="0" to-layer="5837" to-port="0" /> <edge from-layer="5837" from-port="1" to-layer="5838" to-port="1" /> <edge from-layer="5838" from-port="2" to-layer="5840" to-port="0" /> <edge from-layer="5839" from-port="0" to-layer="5840" to-port="1" /> <edge from-layer="5840" from-port="2" to-layer="5841" to-port="0" /> <edge from-layer="5841" from-port="1" to-layer="5842" to-port="1" /> <edge from-layer="5842" from-port="2" to-layer="5844" to-port="0" /> <edge from-layer="5843" from-port="0" to-layer="5844" to-port="1" /> <edge from-layer="5844" from-port="2" to-layer="5846" to-port="0" /> <edge from-layer="5845" from-port="0" to-layer="5846" to-port="1" /> <edge from-layer="5846" from-port="2" to-layer="5847" to-port="1" /> <edge from-layer="5847" from-port="2" to-layer="6119" to-port="0" /> <edge from-layer="5847" from-port="2" to-layer="5848" to-port="0" /> <edge from-layer="5848" from-port="2" to-layer="5849" to-port="0" /> <edge from-layer="5849" from-port="2" to-layer="5851" to-port="0" /> <edge from-layer="5850" from-port="0" to-layer="5851" to-port="1" /> <edge from-layer="5851" from-port="2" to-layer="5852" to-port="2" /> <edge from-layer="5852" from-port="4" to-layer="5854" to-port="0" /> <edge from-layer="5853" from-port="0" to-layer="5854" to-port="1" /> <edge from-layer="5854" from-port="2" to-layer="5855" to-port="0" /> <edge from-layer="5855" from-port="2" to-layer="5864" to-port="0" /> <edge from-layer="5856" from-port="0" to-layer="5857" to-port="0" /> <edge from-layer="5857" from-port="1" to-layer="5860" to-port="0" /> <edge from-layer="5858" from-port="0" to-layer="5859" to-port="0" /> <edge from-layer="5859" from-port="1" to-layer="5860" to-port="1" /> <edge from-layer="5860" from-port="2" to-layer="5862" to-port="0" /> <edge from-layer="5861" from-port="0" to-layer="5862" to-port="1" /> <edge from-layer="5862" from-port="2" to-layer="5863" to-port="0" /> <edge from-layer="5863" from-port="1" to-layer="5864" to-port="1" /> <edge from-layer="5864" from-port="2" to-layer="5865" to-port="1" /> <edge from-layer="5865" from-port="2" to-layer="5869" to-port="0" /> <edge from-layer="5865" from-port="2" to-layer="5907" to-port="0" /> <edge from-layer="5865" from-port="2" to-layer="5876" to-port="0" /> <edge from-layer="5866" from-port="0" to-layer="5877" to-port="0" /> <edge from-layer="5867" from-port="0" to-layer="5875" to-port="0" /> <edge from-layer="5868" from-port="0" to-layer="5869" to-port="1" /> <edge from-layer="5869" from-port="2" to-layer="5871" to-port="0" /> <edge from-layer="5870" from-port="0" to-layer="5871" to-port="1" /> <edge from-layer="5871" from-port="2" to-layer="5873" to-port="0" /> <edge from-layer="5872" from-port="0" to-layer="5873" to-port="1" /> <edge from-layer="5873" from-port="2" to-layer="5874" to-port="0" /> <edge from-layer="5874" from-port="1" to-layer="5875" to-port="1" /> <edge from-layer="5875" from-port="2" to-layer="5876" to-port="1" /> <edge from-layer="5876" from-port="2" to-layer="5877" to-port="1" /> <edge from-layer="5877" from-port="2" to-layer="5896" to-port="0" /> <edge from-layer="5877" from-port="2" to-layer="5886" to-port="0" /> <edge from-layer="5878" from-port="0" to-layer="5879" to-port="0" /> <edge from-layer="5879" from-port="1" to-layer="5882" to-port="0" /> <edge from-layer="5880" from-port="0" to-layer="5881" to-port="0" /> <edge from-layer="5881" from-port="1" to-layer="5882" to-port="1" /> <edge from-layer="5882" from-port="2" to-layer="5884" to-port="0" /> <edge from-layer="5883" from-port="0" to-layer="5884" to-port="1" /> <edge from-layer="5884" from-port="2" to-layer="5885" to-port="0" /> <edge from-layer="5885" from-port="1" to-layer="5886" to-port="1" /> <edge from-layer="5886" from-port="2" to-layer="5887" to-port="0" /> <edge from-layer="5887" from-port="1" to-layer="5897" to-port="0" /> <edge from-layer="5888" from-port="0" to-layer="5889" to-port="0" /> <edge from-layer="5889" from-port="1" to-layer="5892" to-port="0" /> <edge from-layer="5890" from-port="0" to-layer="5891" to-port="0" /> <edge from-layer="5891" from-port="1" to-layer="5892" to-port="1" /> <edge from-layer="5892" from-port="2" to-layer="5894" to-port="0" /> <edge from-layer="5893" from-port="0" to-layer="5894" to-port="1" /> <edge from-layer="5894" from-port="2" to-layer="5895" to-port="0" /> <edge from-layer="5895" from-port="1" to-layer="5896" to-port="1" /> <edge from-layer="5896" from-port="2" to-layer="5897" to-port="1" /> <edge from-layer="5897" from-port="2" to-layer="5906" to-port="0" /> <edge from-layer="5898" from-port="0" to-layer="5899" to-port="0" /> <edge from-layer="5899" from-port="1" to-layer="5902" to-port="0" /> <edge from-layer="5900" from-port="0" to-layer="5901" to-port="0" /> <edge from-layer="5901" from-port="1" to-layer="5902" to-port="1" /> <edge from-layer="5902" from-port="2" to-layer="5904" to-port="0" /> <edge from-layer="5903" from-port="0" to-layer="5904" to-port="1" /> <edge from-layer="5904" from-port="2" to-layer="5905" to-port="0" /> <edge from-layer="5905" from-port="1" to-layer="5906" to-port="1" /> <edge from-layer="5906" from-port="2" to-layer="5907" to-port="1" /> <edge from-layer="5907" from-port="2" to-layer="5918" to-port="0" /> <edge from-layer="5907" from-port="2" to-layer="5911" to-port="0" /> <edge from-layer="5907" from-port="2" to-layer="6016" to-port="0" /> <edge from-layer="5908" from-port="0" to-layer="5919" to-port="0" /> <edge from-layer="5909" from-port="0" to-layer="5917" to-port="0" /> <edge from-layer="5910" from-port="0" to-layer="5911" to-port="1" /> <edge from-layer="5911" from-port="2" to-layer="5913" to-port="0" /> <edge from-layer="5912" from-port="0" to-layer="5913" to-port="1" /> <edge from-layer="5913" from-port="2" to-layer="5915" to-port="0" /> <edge from-layer="5914" from-port="0" to-layer="5915" to-port="1" /> <edge from-layer="5915" from-port="2" to-layer="5916" to-port="0" /> <edge from-layer="5916" from-port="1" to-layer="5917" to-port="1" /> <edge from-layer="5917" from-port="2" to-layer="5918" to-port="1" /> <edge from-layer="5918" from-port="2" to-layer="5919" to-port="1" /> <edge from-layer="5919" from-port="2" to-layer="5993" to-port="0" /> <edge from-layer="5919" from-port="2" to-layer="5958" to-port="0" /> <edge from-layer="5919" from-port="2" to-layer="5928" to-port="0" /> <edge from-layer="5920" from-port="0" to-layer="5921" to-port="0" /> <edge from-layer="5921" from-port="1" to-layer="5924" to-port="0" /> <edge from-layer="5922" from-port="0" to-layer="5923" to-port="0" /> <edge from-layer="5923" from-port="1" to-layer="5924" to-port="1" /> <edge from-layer="5924" from-port="2" to-layer="5926" to-port="0" /> <edge from-layer="5925" from-port="0" to-layer="5926" to-port="1" /> <edge from-layer="5926" from-port="2" to-layer="5927" to-port="0" /> <edge from-layer="5927" from-port="1" to-layer="5928" to-port="1" /> <edge from-layer="5928" from-port="2" to-layer="5930" to-port="0" /> <edge from-layer="5929" from-port="0" to-layer="5930" to-port="1" /> <edge from-layer="5930" from-port="2" to-layer="5932" to-port="0" /> <edge from-layer="5931" from-port="0" to-layer="5932" to-port="1" /> <edge from-layer="5932" from-port="2" to-layer="5937" to-port="0" /> <edge from-layer="5932" from-port="2" to-layer="5933" to-port="0" /> <edge from-layer="5932" from-port="2" to-layer="5943" to-port="0" /> <edge from-layer="5933" from-port="2" to-layer="5946" to-port="0" /> <edge from-layer="5934" from-port="0" to-layer="5937" to-port="1" /> <edge from-layer="5935" from-port="0" to-layer="5937" to-port="2" /> <edge from-layer="5936" from-port="0" to-layer="5937" to-port="3" /> <edge from-layer="5937" from-port="5" to-layer="5939" to-port="0" /> <edge from-layer="5938" from-port="0" to-layer="5939" to-port="1" /> <edge from-layer="5939" from-port="2" to-layer="5944" to-port="0" /> <edge from-layer="5940" from-port="0" to-layer="5943" to-port="1" /> <edge from-layer="5941" from-port="0" to-layer="5943" to-port="2" /> <edge from-layer="5942" from-port="0" to-layer="5943" to-port="3" /> <edge from-layer="5943" from-port="5" to-layer="5944" to-port="1" /> <edge from-layer="5944" from-port="2" to-layer="5945" to-port="0" /> <edge from-layer="5945" from-port="2" to-layer="5946" to-port="1" /> <edge from-layer="5946" from-port="2" to-layer="6003" to-port="0" /> <edge from-layer="5947" from-port="1" to-layer="5949" to-port="0" /> <edge from-layer="5948" from-port="0" to-layer="5949" to-port="2" /> <edge from-layer="5949" from-port="3" to-layer="5977" to-port="0" /> <edge from-layer="5950" from-port="0" to-layer="5951" to-port="0" /> <edge from-layer="5951" from-port="1" to-layer="5954" to-port="0" /> <edge from-layer="5952" from-port="0" to-layer="5953" to-port="0" /> <edge from-layer="5953" from-port="1" to-layer="5954" to-port="1" /> <edge from-layer="5954" from-port="2" to-layer="5956" to-port="0" /> <edge from-layer="5955" from-port="0" to-layer="5956" to-port="1" /> <edge from-layer="5956" from-port="2" to-layer="5957" to-port="0" /> <edge from-layer="5957" from-port="1" to-layer="5958" to-port="1" /> <edge from-layer="5958" from-port="2" to-layer="5960" to-port="0" /> <edge from-layer="5959" from-port="0" to-layer="5960" to-port="1" /> <edge from-layer="5960" from-port="2" to-layer="5962" to-port="0" /> <edge from-layer="5961" from-port="0" to-layer="5962" to-port="1" /> <edge from-layer="5962" from-port="2" to-layer="5967" to-port="0" /> <edge from-layer="5962" from-port="2" to-layer="5973" to-port="0" /> <edge from-layer="5962" from-port="2" to-layer="5963" to-port="0" /> <edge from-layer="5963" from-port="2" to-layer="5976" to-port="0" /> <edge from-layer="5964" from-port="0" to-layer="5967" to-port="1" /> <edge from-layer="5965" from-port="0" to-layer="5967" to-port="2" /> <edge from-layer="5966" from-port="0" to-layer="5967" to-port="3" /> <edge from-layer="5967" from-port="5" to-layer="5969" to-port="0" /> <edge from-layer="5968" from-port="0" to-layer="5969" to-port="1" /> <edge from-layer="5969" from-port="2" to-layer="5974" to-port="0" /> <edge from-layer="5970" from-port="0" to-layer="5973" to-port="1" /> <edge from-layer="5971" from-port="0" to-layer="5973" to-port="2" /> <edge from-layer="5972" from-port="0" to-layer="5973" to-port="3" /> <edge from-layer="5973" from-port="5" to-layer="5974" to-port="1" /> <edge from-layer="5974" from-port="2" to-layer="5975" to-port="0" /> <edge from-layer="5975" from-port="2" to-layer="5976" to-port="1" /> <edge from-layer="5976" from-port="2" to-layer="5977" to-port="1" /> <edge from-layer="5977" from-port="2" to-layer="6118" to-port="0" /> <edge from-layer="5977" from-port="2" to-layer="5978" to-port="0" /> <edge from-layer="5978" from-port="2" to-layer="5979" to-port="0" /> <edge from-layer="5979" from-port="2" to-layer="5981" to-port="0" /> <edge from-layer="5980" from-port="0" to-layer="5981" to-port="1" /> <edge from-layer="5981" from-port="2" to-layer="6003" to-port="1" /> <edge from-layer="5982" from-port="1" to-layer="5984" to-port="0" /> <edge from-layer="5983" from-port="0" to-layer="5984" to-port="2" /> <edge from-layer="5984" from-port="3" to-layer="5998" to-port="0" /> <edge from-layer="5985" from-port="0" to-layer="5986" to-port="0" /> <edge from-layer="5986" from-port="1" to-layer="5989" to-port="0" /> <edge from-layer="5987" from-port="0" to-layer="5988" to-port="0" /> <edge from-layer="5988" from-port="1" to-layer="5989" to-port="1" /> <edge from-layer="5989" from-port="2" to-layer="5991" to-port="0" /> <edge from-layer="5990" from-port="0" to-layer="5991" to-port="1" /> <edge from-layer="5991" from-port="2" to-layer="5992" to-port="0" /> <edge from-layer="5992" from-port="1" to-layer="5993" to-port="1" /> <edge from-layer="5993" from-port="2" to-layer="5995" to-port="0" /> <edge from-layer="5994" from-port="0" to-layer="5995" to-port="1" /> <edge from-layer="5995" from-port="2" to-layer="5997" to-port="0" /> <edge from-layer="5996" from-port="0" to-layer="5997" to-port="1" /> <edge from-layer="5997" from-port="2" to-layer="5998" to-port="1" /> <edge from-layer="5998" from-port="2" to-layer="6117" to-port="0" /> <edge from-layer="5998" from-port="2" to-layer="5999" to-port="0" /> <edge from-layer="5999" from-port="2" to-layer="6000" to-port="0" /> <edge from-layer="6000" from-port="2" to-layer="6002" to-port="0" /> <edge from-layer="6001" from-port="0" to-layer="6002" to-port="1" /> <edge from-layer="6002" from-port="2" to-layer="6003" to-port="2" /> <edge from-layer="6003" from-port="4" to-layer="6005" to-port="0" /> <edge from-layer="6004" from-port="0" to-layer="6005" to-port="1" /> <edge from-layer="6005" from-port="2" to-layer="6006" to-port="0" /> <edge from-layer="6006" from-port="2" to-layer="6015" to-port="0" /> <edge from-layer="6007" from-port="0" to-layer="6008" to-port="0" /> <edge from-layer="6008" from-port="1" to-layer="6011" to-port="0" /> <edge from-layer="6009" from-port="0" to-layer="6010" to-port="0" /> <edge from-layer="6010" from-port="1" to-layer="6011" to-port="1" /> <edge from-layer="6011" from-port="2" to-layer="6013" to-port="0" /> <edge from-layer="6012" from-port="0" to-layer="6013" to-port="1" /> <edge from-layer="6013" from-port="2" to-layer="6014" to-port="0" /> <edge from-layer="6014" from-port="1" to-layer="6015" to-port="1" /> <edge from-layer="6015" from-port="2" to-layer="6016" to-port="1" /> <edge from-layer="6016" from-port="2" to-layer="6020" to-port="0" /> <edge from-layer="6016" from-port="2" to-layer="6027" to-port="0" /> <edge from-layer="6016" from-port="2" to-layer="6058" to-port="0" /> <edge from-layer="6017" from-port="0" to-layer="6028" to-port="0" /> <edge from-layer="6018" from-port="0" to-layer="6026" to-port="0" /> <edge from-layer="6019" from-port="0" to-layer="6020" to-port="1" /> <edge from-layer="6020" from-port="2" to-layer="6022" to-port="0" /> <edge from-layer="6021" from-port="0" to-layer="6022" to-port="1" /> <edge from-layer="6022" from-port="2" to-layer="6024" to-port="0" /> <edge from-layer="6023" from-port="0" to-layer="6024" to-port="1" /> <edge from-layer="6024" from-port="2" to-layer="6025" to-port="0" /> <edge from-layer="6025" from-port="1" to-layer="6026" to-port="1" /> <edge from-layer="6026" from-port="2" to-layer="6027" to-port="1" /> <edge from-layer="6027" from-port="2" to-layer="6028" to-port="1" /> <edge from-layer="6028" from-port="2" to-layer="6037" to-port="0" /> <edge from-layer="6028" from-port="2" to-layer="6047" to-port="0" /> <edge from-layer="6029" from-port="0" to-layer="6030" to-port="0" /> <edge from-layer="6030" from-port="1" to-layer="6033" to-port="0" /> <edge from-layer="6031" from-port="0" to-layer="6032" to-port="0" /> <edge from-layer="6032" from-port="1" to-layer="6033" to-port="1" /> <edge from-layer="6033" from-port="2" to-layer="6035" to-port="0" /> <edge from-layer="6034" from-port="0" to-layer="6035" to-port="1" /> <edge from-layer="6035" from-port="2" to-layer="6036" to-port="0" /> <edge from-layer="6036" from-port="1" to-layer="6037" to-port="1" /> <edge from-layer="6037" from-port="2" to-layer="6038" to-port="0" /> <edge from-layer="6038" from-port="1" to-layer="6048" to-port="0" /> <edge from-layer="6039" from-port="0" to-layer="6040" to-port="0" /> <edge from-layer="6040" from-port="1" to-layer="6043" to-port="0" /> <edge from-layer="6041" from-port="0" to-layer="6042" to-port="0" /> <edge from-layer="6042" from-port="1" to-layer="6043" to-port="1" /> <edge from-layer="6043" from-port="2" to-layer="6045" to-port="0" /> <edge from-layer="6044" from-port="0" to-layer="6045" to-port="1" /> <edge from-layer="6045" from-port="2" to-layer="6046" to-port="0" /> <edge from-layer="6046" from-port="1" to-layer="6047" to-port="1" /> <edge from-layer="6047" from-port="2" to-layer="6048" to-port="1" /> <edge from-layer="6048" from-port="2" to-layer="6057" to-port="0" /> <edge from-layer="6049" from-port="0" to-layer="6050" to-port="0" /> <edge from-layer="6050" from-port="1" to-layer="6053" to-port="0" /> <edge from-layer="6051" from-port="0" to-layer="6052" to-port="0" /> <edge from-layer="6052" from-port="1" to-layer="6053" to-port="1" /> <edge from-layer="6053" from-port="2" to-layer="6055" to-port="0" /> <edge from-layer="6054" from-port="0" to-layer="6055" to-port="1" /> <edge from-layer="6055" from-port="2" to-layer="6056" to-port="0" /> <edge from-layer="6056" from-port="1" to-layer="6057" to-port="1" /> <edge from-layer="6057" from-port="2" to-layer="6058" to-port="1" /> <edge from-layer="6058" from-port="2" to-layer="6061" to-port="0" /> <edge from-layer="6058" from-port="2" to-layer="6232" to-port="0" /> <edge from-layer="6058" from-port="2" to-layer="6068" to-port="0" /> <edge from-layer="6059" from-port="0" to-layer="6067" to-port="0" /> <edge from-layer="6060" from-port="0" to-layer="6061" to-port="1" /> <edge from-layer="6061" from-port="2" to-layer="6063" to-port="0" /> <edge from-layer="6062" from-port="0" to-layer="6063" to-port="1" /> <edge from-layer="6063" from-port="2" to-layer="6065" to-port="0" /> <edge from-layer="6064" from-port="0" to-layer="6065" to-port="1" /> <edge from-layer="6065" from-port="2" to-layer="6066" to-port="0" /> <edge from-layer="6066" from-port="1" to-layer="6067" to-port="1" /> <edge from-layer="6067" from-port="2" to-layer="6068" to-port="1" /> <edge from-layer="6068" from-port="2" to-layer="6069" to-port="1" /> <edge from-layer="6069" from-port="2" to-layer="6192" to-port="0" /> <edge from-layer="6069" from-port="2" to-layer="6078" to-port="0" /> <edge from-layer="6069" from-port="2" to-layer="6096" to-port="0" /> <edge from-layer="6070" from-port="0" to-layer="6071" to-port="0" /> <edge from-layer="6071" from-port="1" to-layer="6074" to-port="0" /> <edge from-layer="6072" from-port="0" to-layer="6073" to-port="0" /> <edge from-layer="6073" from-port="1" to-layer="6074" to-port="1" /> <edge from-layer="6074" from-port="2" to-layer="6076" to-port="0" /> <edge from-layer="6075" from-port="0" to-layer="6076" to-port="1" /> <edge from-layer="6076" from-port="2" to-layer="6077" to-port="0" /> <edge from-layer="6077" from-port="1" to-layer="6078" to-port="1" /> <edge from-layer="6078" from-port="2" to-layer="6080" to-port="0" /> <edge from-layer="6079" from-port="0" to-layer="6080" to-port="1" /> <edge from-layer="6080" from-port="2" to-layer="6082" to-port="0" /> <edge from-layer="6081" from-port="0" to-layer="6082" to-port="1" /> <edge from-layer="6082" from-port="2" to-layer="6083" to-port="1" /> <edge from-layer="6083" from-port="2" to-layer="6215" to-port="0" /> <edge from-layer="6083" from-port="2" to-layer="6084" to-port="0" /> <edge from-layer="6085" from-port="1" to-layer="6087" to-port="0" /> <edge from-layer="6086" from-port="0" to-layer="6087" to-port="2" /> <edge from-layer="6087" from-port="3" to-layer="6115" to-port="0" /> <edge from-layer="6088" from-port="0" to-layer="6089" to-port="0" /> <edge from-layer="6089" from-port="1" to-layer="6092" to-port="0" /> <edge from-layer="6090" from-port="0" to-layer="6091" to-port="0" /> <edge from-layer="6091" from-port="1" to-layer="6092" to-port="1" /> <edge from-layer="6092" from-port="2" to-layer="6094" to-port="0" /> <edge from-layer="6093" from-port="0" to-layer="6094" to-port="1" /> <edge from-layer="6094" from-port="2" to-layer="6095" to-port="0" /> <edge from-layer="6095" from-port="1" to-layer="6096" to-port="1" /> <edge from-layer="6096" from-port="2" to-layer="6098" to-port="0" /> <edge from-layer="6097" from-port="0" to-layer="6098" to-port="1" /> <edge from-layer="6098" from-port="2" to-layer="6100" to-port="0" /> <edge from-layer="6099" from-port="0" to-layer="6100" to-port="1" /> <edge from-layer="6100" from-port="2" to-layer="6101" to-port="0" /> <edge from-layer="6100" from-port="2" to-layer="6105" to-port="0" /> <edge from-layer="6100" from-port="2" to-layer="6111" to-port="0" /> <edge from-layer="6101" from-port="2" to-layer="6114" to-port="0" /> <edge from-layer="6102" from-port="0" to-layer="6105" to-port="1" /> <edge from-layer="6103" from-port="0" to-layer="6105" to-port="2" /> <edge from-layer="6104" from-port="0" to-layer="6105" to-port="3" /> <edge from-layer="6105" from-port="5" to-layer="6107" to-port="0" /> <edge from-layer="6106" from-port="0" to-layer="6107" to-port="1" /> <edge from-layer="6107" from-port="2" to-layer="6112" to-port="0" /> <edge from-layer="6108" from-port="0" to-layer="6111" to-port="1" /> <edge from-layer="6109" from-port="0" to-layer="6111" to-port="2" /> <edge from-layer="6110" from-port="0" to-layer="6111" to-port="3" /> <edge from-layer="6111" from-port="5" to-layer="6112" to-port="1" /> <edge from-layer="6112" from-port="2" to-layer="6113" to-port="0" /> <edge from-layer="6113" from-port="2" to-layer="6114" to-port="1" /> <edge from-layer="6114" from-port="2" to-layer="6115" to-port="1" /> <edge from-layer="6115" from-port="2" to-layer="6116" to-port="0" /> <edge from-layer="6115" from-port="2" to-layer="6211" to-port="0" /> <edge from-layer="6183" from-port="0" to-layer="6285" to-port="0" /> <edge from-layer="6184" from-port="0" to-layer="6185" to-port="0" /> <edge from-layer="6185" from-port="1" to-layer="6188" to-port="0" /> <edge from-layer="6186" from-port="0" to-layer="6187" to-port="0" /> <edge from-layer="6187" from-port="1" to-layer="6188" to-port="1" /> <edge from-layer="6188" from-port="2" to-layer="6190" to-port="0" /> <edge from-layer="6189" from-port="0" to-layer="6190" to-port="1" /> <edge from-layer="6190" from-port="2" to-layer="6191" to-port="0" /> <edge from-layer="6191" from-port="1" to-layer="6192" to-port="1" /> <edge from-layer="6192" from-port="2" to-layer="6194" to-port="0" /> <edge from-layer="6193" from-port="0" to-layer="6194" to-port="1" /> <edge from-layer="6194" from-port="2" to-layer="6196" to-port="0" /> <edge from-layer="6195" from-port="0" to-layer="6196" to-port="1" /> <edge from-layer="6196" from-port="2" to-layer="6207" to-port="0" /> <edge from-layer="6196" from-port="2" to-layer="6201" to-port="0" /> <edge from-layer="6196" from-port="2" to-layer="6197" to-port="0" /> <edge from-layer="6197" from-port="2" to-layer="6210" to-port="0" /> <edge from-layer="6198" from-port="0" to-layer="6201" to-port="1" /> <edge from-layer="6199" from-port="0" to-layer="6201" to-port="2" /> <edge from-layer="6200" from-port="0" to-layer="6201" to-port="3" /> <edge from-layer="6201" from-port="5" to-layer="6203" to-port="0" /> <edge from-layer="6202" from-port="0" to-layer="6203" to-port="1" /> <edge from-layer="6203" from-port="2" to-layer="6208" to-port="0" /> <edge from-layer="6204" from-port="0" to-layer="6207" to-port="1" /> <edge from-layer="6205" from-port="0" to-layer="6207" to-port="2" /> <edge from-layer="6206" from-port="0" to-layer="6207" to-port="3" /> <edge from-layer="6207" from-port="5" to-layer="6208" to-port="1" /> <edge from-layer="6208" from-port="2" to-layer="6209" to-port="0" /> <edge from-layer="6209" from-port="2" to-layer="6210" to-port="1" /> <edge from-layer="6210" from-port="2" to-layer="6219" to-port="0" /> <edge from-layer="6211" from-port="2" to-layer="6212" to-port="0" /> <edge from-layer="6212" from-port="2" to-layer="6214" to-port="0" /> <edge from-layer="6213" from-port="0" to-layer="6214" to-port="1" /> <edge from-layer="6214" from-port="2" to-layer="6219" to-port="1" /> <edge from-layer="6215" from-port="2" to-layer="6216" to-port="0" /> <edge from-layer="6216" from-port="2" to-layer="6218" to-port="0" /> <edge from-layer="6217" from-port="0" to-layer="6218" to-port="1" /> <edge from-layer="6218" from-port="2" to-layer="6219" to-port="2" /> <edge from-layer="6219" from-port="4" to-layer="6221" to-port="0" /> <edge from-layer="6220" from-port="0" to-layer="6221" to-port="1" /> <edge from-layer="6221" from-port="2" to-layer="6222" to-port="0" /> <edge from-layer="6222" from-port="2" to-layer="6231" to-port="0" /> <edge from-layer="6223" from-port="0" to-layer="6224" to-port="0" /> <edge from-layer="6224" from-port="1" to-layer="6227" to-port="0" /> <edge from-layer="6225" from-port="0" to-layer="6226" to-port="0" /> <edge from-layer="6226" from-port="1" to-layer="6227" to-port="1" /> <edge from-layer="6227" from-port="2" to-layer="6229" to-port="0" /> <edge from-layer="6228" from-port="0" to-layer="6229" to-port="1" /> <edge from-layer="6229" from-port="2" to-layer="6230" to-port="0" /> <edge from-layer="6230" from-port="1" to-layer="6231" to-port="1" /> <edge from-layer="6231" from-port="2" to-layer="6232" to-port="1" /> <edge from-layer="6232" from-port="2" to-layer="6274" to-port="0" /> <edge from-layer="6232" from-port="2" to-layer="6236" to-port="0" /> <edge from-layer="6232" from-port="2" to-layer="6243" to-port="0" /> <edge from-layer="6233" from-port="0" to-layer="6244" to-port="0" /> <edge from-layer="6234" from-port="0" to-layer="6242" to-port="0" /> <edge from-layer="6235" from-port="0" to-layer="6236" to-port="1" /> <edge from-layer="6236" from-port="2" to-layer="6238" to-port="0" /> <edge from-layer="6237" from-port="0" to-layer="6238" to-port="1" /> <edge from-layer="6238" from-port="2" to-layer="6240" to-port="0" /> <edge from-layer="6239" from-port="0" to-layer="6240" to-port="1" /> <edge from-layer="6240" from-port="2" to-layer="6241" to-port="0" /> <edge from-layer="6241" from-port="1" to-layer="6242" to-port="1" /> <edge from-layer="6242" from-port="2" to-layer="6243" to-port="1" /> <edge from-layer="6243" from-port="2" to-layer="6244" to-port="1" /> <edge from-layer="6244" from-port="2" to-layer="6263" to-port="0" /> <edge from-layer="6244" from-port="2" to-layer="6253" to-port="0" /> <edge from-layer="6245" from-port="0" to-layer="6246" to-port="0" /> <edge from-layer="6246" from-port="1" to-layer="6249" to-port="0" /> <edge from-layer="6247" from-port="0" to-layer="6248" to-port="0" /> <edge from-layer="6248" from-port="1" to-layer="6249" to-port="1" /> <edge from-layer="6249" from-port="2" to-layer="6251" to-port="0" /> <edge from-layer="6250" from-port="0" to-layer="6251" to-port="1" /> <edge from-layer="6251" from-port="2" to-layer="6252" to-port="0" /> <edge from-layer="6252" from-port="1" to-layer="6253" to-port="1" /> <edge from-layer="6253" from-port="2" to-layer="6254" to-port="0" /> <edge from-layer="6254" from-port="1" to-layer="6264" to-port="0" /> <edge from-layer="6255" from-port="0" to-layer="6256" to-port="0" /> <edge from-layer="6256" from-port="1" to-layer="6259" to-port="0" /> <edge from-layer="6257" from-port="0" to-layer="6258" to-port="0" /> <edge from-layer="6258" from-port="1" to-layer="6259" to-port="1" /> <edge from-layer="6259" from-port="2" to-layer="6261" to-port="0" /> <edge from-layer="6260" from-port="0" to-layer="6261" to-port="1" /> <edge from-layer="6261" from-port="2" to-layer="6262" to-port="0" /> <edge from-layer="6262" from-port="1" to-layer="6263" to-port="1" /> <edge from-layer="6263" from-port="2" to-layer="6264" to-port="1" /> <edge from-layer="6264" from-port="2" to-layer="6273" to-port="0" /> <edge from-layer="6265" from-port="0" to-layer="6266" to-port="0" /> <edge from-layer="6266" from-port="1" to-layer="6269" to-port="0" /> <edge from-layer="6267" from-port="0" to-layer="6268" to-port="0" /> <edge from-layer="6268" from-port="1" to-layer="6269" to-port="1" /> <edge from-layer="6269" from-port="2" to-layer="6271" to-port="0" /> <edge from-layer="6270" from-port="0" to-layer="6271" to-port="1" /> <edge from-layer="6271" from-port="2" to-layer="6272" to-port="0" /> <edge from-layer="6272" from-port="1" to-layer="6273" to-port="1" /> <edge from-layer="6273" from-port="2" to-layer="6274" to-port="1" /> <edge from-layer="6274" from-port="2" to-layer="6277" to-port="0" /> <edge from-layer="6274" from-port="2" to-layer="6284" to-port="0" /> <edge from-layer="6275" from-port="0" to-layer="6283" to-port="0" /> <edge from-layer="6276" from-port="0" to-layer="6277" to-port="1" /> <edge from-layer="6277" from-port="2" to-layer="6279" to-port="0" /> <edge from-layer="6278" from-port="0" to-layer="6279" to-port="1" /> <edge from-layer="6279" from-port="2" to-layer="6281" to-port="0" /> <edge from-layer="6280" from-port="0" to-layer="6281" to-port="1" /> <edge from-layer="6281" from-port="2" to-layer="6282" to-port="0" /> <edge from-layer="6282" from-port="1" to-layer="6283" to-port="1" /> <edge from-layer="6283" from-port="2" to-layer="6284" to-port="1" /> <edge from-layer="6284" from-port="2" to-layer="6285" to-port="1" /> <edge from-layer="6285" from-port="2" to-layer="6294" to-port="0" /> <edge from-layer="6286" from-port="0" to-layer="6287" to-port="0" /> <edge from-layer="6287" from-port="1" to-layer="6290" to-port="0" /> <edge from-layer="6288" from-port="0" to-layer="6289" to-port="0" /> <edge from-layer="6289" from-port="1" to-layer="6290" to-port="1" /> <edge from-layer="6290" from-port="2" to-layer="6292" to-port="0" /> <edge from-layer="6291" from-port="0" to-layer="6292" to-port="1" /> <edge from-layer="6292" from-port="2" to-layer="6293" to-port="0" /> <edge from-layer="6293" from-port="1" to-layer="6294" to-port="1" /> <edge from-layer="6294" from-port="2" to-layer="6295" to-port="0" /> </edges> <rt_info> <Runtime_version value="2025.0.0-17720-1ec91fc6b64" /> <conversion_parameters> <framework value="pytorch" /> <is_python_object value="True" /> </conversion_parameters> <nncf> <friendly_names_were_updated value="True" /> <weight_compression> <advanced_parameters value="{'statistics_path': None, 'awq_params': {'subset_size': 32, 'percent_to_apply': 0.002, 'alpha_min': 0.0, 'alpha_max': 1.0, 'steps': 100}, 'scale_estimation_params': {'subset_size': 64, 'initial_steps': 5, 'scale_steps': 5, 'weight_penalty': -1.0}, 'gptq_params': {'damp_percent': 0.1, 'block_size': 128, 'subset_size': 128}, 'lora_correction_params': {'adapter_rank': 8, 'num_iterations': 3, 'apply_regularization': True, 'subset_size': 128, 'use_int8_adapters': True}}" /> <all_layers value="False" /> <awq value="False" /> <backup_mode value="int8_asym" /> <gptq value="False" /> <group_size value="-1" /> <ignored_scope value="[]" /> <lora_correction value="False" /> <mode value="int8_asym" /> <ratio value="1.0" /> <scale_estimation value="False" /> <sensitivity_metric value="weight_quantization_error" /> </weight_compression> </nncf> <optimum> <optimum_intel_version value="1.22.0.dev0+014a840" /> <optimum_version value="1.24.0.dev0" /> <pytorch_version value="2.4.1+cpu" /> <transformers_version value="4.47.1" /> </optimum> <runtime_options> <ACTIVATIONS_SCALE_FACTOR value="8.0" /> <KV_CACHE_PRECISION value="f16" /> </runtime_options> </rt_info> </net>