diff --git "a/openvino/openvino_model.xml" "b/openvino/openvino_model.xml" new file mode 100644--- /dev/null +++ "b/openvino/openvino_model.xml" @@ -0,0 +1,12168 @@ +<?xml version="1.0"?> +<net name="Model4940" version="11"> + <layers> + <layer id="2" name="input_ids" type="Parameter" version="opset1"> + <data shape="?,?" element_type="i64" /> + <output> + <port id="0" precision="I64" names="input_ids"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1" name="attention_mask" type="Parameter" version="opset1"> + <data shape="?,?" element_type="i64" /> + <output> + <port id="0" precision="I64" names="attention_mask"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="0" name="token_type_ids" type="Parameter" version="opset1"> + <data shape="?,?" element_type="i64" /> + <output> + <port id="0" precision="I64" names="token_type_ids"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3" name="self.embeddings.word_embeddings.weight" type="Const" version="opset1"> + <data element_type="f32" shape="21128, 768" offset="0" size="64905216" /> + <output> + <port id="0" precision="FP32" names="self.embeddings.word_embeddings.weight"> + <dim>21128</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="4" name="__module.embeddings.word_embeddings/aten::embedding/Convert" type="Convert" version="opset1"> + <data destination_type="i32" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5" name="__module.embeddings.word_embeddings/aten::embedding/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="64905216" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6" name="__module.embeddings.word_embeddings/aten::embedding/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>21128</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="79,inputs_embeds"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="7" name="self.embeddings.token_type_embeddings.weight" type="Const" version="opset1"> + <data element_type="f32" shape="2, 768" offset="64905220" size="6144" /> + <output> + <port id="0" precision="FP32" names="self.embeddings.token_type_embeddings.weight"> + <dim>2</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="8" name="__module.embeddings.token_type_embeddings/aten::embedding/Convert" type="Convert" version="opset1"> + <data destination_type="i32" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="9" name="__module.embeddings.token_type_embeddings/aten::embedding/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="64905216" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10" name="__module.embeddings.token_type_embeddings/aten::embedding/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>2</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="81,token_type_embeddings.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="11" name="__module.embeddings/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="82_1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="12" name="self.embeddings.position_embeddings.weight" type="Const" version="opset1"> + <data element_type="f32" shape="512, 768" offset="64911364" size="1572864" /> + <output> + <port id="0" precision="FP32" names="self.embeddings.position_embeddings.weight"> + <dim>512</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="13" name="__module.embeddings/aten::slice/Slice" type="Const" version="opset1"> + <data element_type="i64" shape="1, 512" offset="66484228" size="4096" /> + <output> + <port id="0" precision="I64" names="76"> + <dim>1</dim> + <dim>512</dim> + </port> + </output> + </layer> + <layer id="14" name="__module.embeddings/aten::slice/Reshape" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="66488324" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="15" name="ShapeOf_4461957" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="16" name="Constant_4462085" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="66488332" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="17" name="Constant_4461959" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="66488324" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="18" name="Gather_4461960" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="10,17,19,72,74,75,8"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="19" name="__module.embeddings/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="66488332" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="20" name="__module.embeddings/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="66488332" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="21" name="__module.embeddings/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + <dim>512</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="I64" names="77"> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="22" name="__module.embeddings.position_embeddings/aten::embedding/Convert" type="Convert" version="opset1"> + <data destination_type="i32" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I32"> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="23" name="__module.embeddings.position_embeddings/aten::embedding/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="64905216" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="24" name="__module.embeddings.position_embeddings/aten::embedding/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>512</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="84,position_embeddings.1"> + <dim>1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="25" name="__module.embeddings/aten::add_/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="82,embeddings.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="26" name="__module.embeddings.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="27" name="__module.embeddings.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="28" name="Constant_4461730" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="66488344" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="29" name="__module.embeddings.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="30" name="Constant_4461731" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="66491416" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="31" name="__module.embeddings.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="89,input.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="32" name="self.encoder.layer.0.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="66494488" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.0.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="33" name="__module.encoder.layer.0.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="34" name="Constant_4461732" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="68853784" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="35" name="__module.encoder.layer.0.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="141,x.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="36" name="__module.encoder.layer.0.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="37" name="__module.encoder.layer.0.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="145,x.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="38" name="Constant_4452609" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="146"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="39" name="__module.encoder.layer.0.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="147"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="40" name="self.encoder.layer.0.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="68856920" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.0.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="41" name="__module.encoder.layer.0.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="42" name="Constant_4461733" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="71216216" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="43" name="__module.encoder.layer.0.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="150,x.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="44" name="__module.encoder.layer.0.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="45" name="__module.encoder.layer.0.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="154,x.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="46" name="Constant_4452634" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="155"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="47" name="__module.encoder.layer.0.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="156"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="48" name="self.encoder.layer.0.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="71219288" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.0.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="49" name="__module.encoder.layer.0.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="50" name="Constant_4461734" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="73578584" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="51" name="__module.encoder.layer.0.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="159,x.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="52" name="__module.encoder.layer.0.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="53" name="__module.encoder.layer.0.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="163,x.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="54" name="Constant_4452659" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="164"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="55" name="__module.encoder.layer.0.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="165"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="56" name="Constant_4461736" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="73581656" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="57" name="25" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="66488332" size="8" /> + <output> + <port id="0" precision="I64" names="25" /> + </output> + </layer> + <layer id="58" name="aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="26"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="59" name="27" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="73581660" size="8" /> + <output> + <port id="0" precision="I64" names="27" /> + </output> + </layer> + <layer id="60" name="aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="28,33"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="61" name="Constant_4462088" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="66488324" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="62" name="Constant_4461967" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="66488324" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="63" name="Gather_4461968" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="13,15"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="64" name="Constant_4460354" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="66488332" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="65" name="Constant_4462090" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="73581668" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="66" name="Constant_4462091" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="66488324" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="67" name="Gather_4462092" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="68" name="prim::ListConstruct/Concat" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="35"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="69" name="aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="37"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="70" name="aten::to/Convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="42"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="71" name="Constant_4461735" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="73581656" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="72" name="aten::rsub/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="73" name="aten::rsub/Subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="45,inverted_mask"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="74" name="aten::to/Convert_1" type="Convert" version="opset1"> + <data destination_type="boolean" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="BOOL" names="50"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="75" name="aten::masked_fill/ConvertLike" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="73581684" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="76" name="aten::masked_fill/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="3" precision="FP32" names="52"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="77" name="__module.encoder.layer.0.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="166,attn_output.1"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="78" name="__module.encoder.layer.0.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="79" name="__module.encoder.layer.0.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="167,attn_output.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="80" name="Constant_4461976" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="81" name="__module.encoder.layer.0.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="169"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="82" name="self.encoder.layer.0.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="73581728" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.0.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="83" name="__module.encoder.layer.0.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="84" name="Constant_4461737" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="75941024" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="85" name="__module.encoder.layer.0.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="175,input.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="86" name="__module.encoder.layer.0.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="177"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="87" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="88" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="89" name="Constant_4461738" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="75944096" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="90" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="91" name="Constant_4461739" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="75947168" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="92" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="181,input_tensor.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="93" name="self.encoder.layer.0.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="75950240" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.0.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="94" name="__module.encoder.layer.0.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="95" name="Constant_4461740" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="85387424" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="96" name="__module.encoder.layer.0.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="186"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="97" name="__module.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="187"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="98" name="self.encoder.layer.0.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="85399712" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.0.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="99" name="__module.encoder.layer.0.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="100" name="Constant_4461741" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="94836896" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="101" name="__module.encoder.layer.0.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="193,input.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="102" name="__module.encoder.layer.0.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="195"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="103" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="104" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="105" name="Constant_4461742" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="94839968" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="106" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="107" name="Constant_4461743" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="94843040" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="108" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="199,hidden_states.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="109" name="self.encoder.layer.1.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="94846112" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.1.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="110" name="__module.encoder.layer.1.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="111" name="Constant_4461744" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="97205408" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="112" name="__module.encoder.layer.1.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="212,x.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="113" name="__module.encoder.layer.1.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="114" name="__module.encoder.layer.1.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="216,x.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="115" name="Constant_4452841" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="217"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="116" name="__module.encoder.layer.1.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="218"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="117" name="self.encoder.layer.1.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="97208480" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.1.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="118" name="__module.encoder.layer.1.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="119" name="Constant_4461745" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="99567776" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="120" name="__module.encoder.layer.1.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="221,x.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="121" name="__module.encoder.layer.1.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="122" name="__module.encoder.layer.1.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="225,x.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="123" name="Constant_4452864" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="226"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="124" name="__module.encoder.layer.1.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="227"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="125" name="self.encoder.layer.1.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="99570848" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.1.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="126" name="__module.encoder.layer.1.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="127" name="Constant_4461746" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="101930144" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="128" name="__module.encoder.layer.1.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="230,x.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="129" name="__module.encoder.layer.1.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="130" name="__module.encoder.layer.1.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="234,x.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="131" name="Constant_4452887" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="235"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="132" name="__module.encoder.layer.1.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="236"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="133" name="__module.encoder.layer.1.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="237,attn_output.5"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="134" name="__module.encoder.layer.1.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="135" name="__module.encoder.layer.1.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="238,attn_output.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="136" name="Constant_4461977" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="137" name="__module.encoder.layer.1.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="240"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="138" name="self.encoder.layer.1.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="101933216" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.1.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="139" name="__module.encoder.layer.1.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="140" name="Constant_4461747" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="104292512" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="141" name="__module.encoder.layer.1.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="246,input.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="142" name="__module.encoder.layer.1.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="248"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="143" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="144" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="145" name="Constant_4461748" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="104295584" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="146" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="147" name="Constant_4461749" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="104298656" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="148" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="252,input_tensor.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="149" name="self.encoder.layer.1.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="104301728" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.1.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="150" name="__module.encoder.layer.1.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="151" name="Constant_4461750" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="113738912" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="152" name="__module.encoder.layer.1.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="257"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="153" name="__module.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="258"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="154" name="self.encoder.layer.1.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="113751200" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.1.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="155" name="__module.encoder.layer.1.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="156" name="Constant_4461751" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="123188384" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="157" name="__module.encoder.layer.1.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="264,input.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="158" name="__module.encoder.layer.1.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="266"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="159" name="__module.encoder.layer.1.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="160" name="__module.encoder.layer.1.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="161" name="Constant_4461752" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="123191456" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="162" name="__module.encoder.layer.1.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="163" name="Constant_4461753" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="123194528" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="164" name="__module.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="270,hidden_states.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="165" name="self.encoder.layer.2.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="123197600" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.2.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="166" name="__module.encoder.layer.2.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="167" name="Constant_4461754" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="125556896" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="168" name="__module.encoder.layer.2.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="283,x.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="169" name="__module.encoder.layer.2.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="170" name="__module.encoder.layer.2.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="287,x.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="171" name="Constant_4453067" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="288"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="172" name="__module.encoder.layer.2.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="289"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="173" name="self.encoder.layer.2.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="125559968" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.2.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="174" name="__module.encoder.layer.2.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="175" name="Constant_4461755" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="127919264" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="176" name="__module.encoder.layer.2.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="292,x.29"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="177" name="__module.encoder.layer.2.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="178" name="__module.encoder.layer.2.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="296,x.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="179" name="Constant_4453090" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="297"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="180" name="__module.encoder.layer.2.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="298"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="181" name="self.encoder.layer.2.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="127922336" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.2.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="182" name="__module.encoder.layer.2.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="183" name="Constant_4461756" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="130281632" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="184" name="__module.encoder.layer.2.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="301,x.33"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="185" name="__module.encoder.layer.2.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="186" name="__module.encoder.layer.2.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="305,x.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="187" name="Constant_4453113" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="306"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="188" name="__module.encoder.layer.2.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="307"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="189" name="__module.encoder.layer.2.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="308,attn_output.9"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="190" name="__module.encoder.layer.2.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="191" name="__module.encoder.layer.2.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="309,attn_output.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="192" name="Constant_4461978" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="193" name="__module.encoder.layer.2.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="311"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="194" name="self.encoder.layer.2.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="130284704" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.2.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="195" name="__module.encoder.layer.2.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="196" name="Constant_4461757" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="132644000" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="197" name="__module.encoder.layer.2.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="317,input.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="198" name="__module.encoder.layer.2.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="319"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="199" name="__module.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="200" name="__module.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="201" name="Constant_4461758" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="132647072" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="202" name="__module.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="203" name="Constant_4461759" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="132650144" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="204" name="__module.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="323,input_tensor.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="205" name="self.encoder.layer.2.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="132653216" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.2.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="206" name="__module.encoder.layer.2.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="207" name="Constant_4461760" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="142090400" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="208" name="__module.encoder.layer.2.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="328"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="209" name="__module.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="329"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="210" name="self.encoder.layer.2.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="142102688" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.2.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="211" name="__module.encoder.layer.2.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="212" name="Constant_4461761" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="151539872" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="213" name="__module.encoder.layer.2.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="335,input.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="214" name="__module.encoder.layer.2.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="337"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="215" name="__module.encoder.layer.2.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="216" name="__module.encoder.layer.2.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="217" name="Constant_4461762" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="151542944" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="218" name="__module.encoder.layer.2.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="219" name="Constant_4461763" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="151546016" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="220" name="__module.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="341,hidden_states.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="221" name="self.encoder.layer.3.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="151549088" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.3.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="222" name="__module.encoder.layer.3.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="223" name="Constant_4461764" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="153908384" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="224" name="__module.encoder.layer.3.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="354,x.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="225" name="__module.encoder.layer.3.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="226" name="__module.encoder.layer.3.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="358,x.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="227" name="Constant_4453293" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="359"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="228" name="__module.encoder.layer.3.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="360"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="229" name="self.encoder.layer.3.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="153911456" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.3.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="230" name="__module.encoder.layer.3.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="231" name="Constant_4461765" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="156270752" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="232" name="__module.encoder.layer.3.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="363,x.41"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="233" name="__module.encoder.layer.3.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="234" name="__module.encoder.layer.3.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="367,x.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="235" name="Constant_4453316" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="368"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="236" name="__module.encoder.layer.3.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="369"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="237" name="self.encoder.layer.3.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="156273824" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.3.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="238" name="__module.encoder.layer.3.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="239" name="Constant_4461766" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="158633120" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="240" name="__module.encoder.layer.3.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="372,x.45"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="241" name="__module.encoder.layer.3.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="242" name="__module.encoder.layer.3.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="376,x.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="243" name="Constant_4453339" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="377"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="244" name="__module.encoder.layer.3.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="378"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="245" name="__module.encoder.layer.3.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="379,attn_output.13"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="246" name="__module.encoder.layer.3.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="247" name="__module.encoder.layer.3.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="380,attn_output.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="248" name="Constant_4461979" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="249" name="__module.encoder.layer.3.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="382"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="250" name="self.encoder.layer.3.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="158636192" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.3.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="251" name="__module.encoder.layer.3.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="252" name="Constant_4461767" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="160995488" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="253" name="__module.encoder.layer.3.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="388,input.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="254" name="__module.encoder.layer.3.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="390"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="255" name="__module.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="256" name="__module.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="257" name="Constant_4461768" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="160998560" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="258" name="__module.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="259" name="Constant_4461769" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="161001632" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="260" name="__module.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="394,input_tensor.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="261" name="self.encoder.layer.3.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="161004704" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.3.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="262" name="__module.encoder.layer.3.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="263" name="Constant_4461770" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="170441888" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="264" name="__module.encoder.layer.3.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="399"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="265" name="__module.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="400"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="266" name="self.encoder.layer.3.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="170454176" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.3.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="267" name="__module.encoder.layer.3.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="268" name="Constant_4461771" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="179891360" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="269" name="__module.encoder.layer.3.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="406,input.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="270" name="__module.encoder.layer.3.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="408"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="271" name="__module.encoder.layer.3.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="272" name="__module.encoder.layer.3.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="273" name="Constant_4461772" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="179894432" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="274" name="__module.encoder.layer.3.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="275" name="Constant_4461773" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="179897504" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="276" name="__module.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="412,hidden_states.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="277" name="self.encoder.layer.4.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="179900576" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.4.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="278" name="__module.encoder.layer.4.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="279" name="Constant_4461774" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="182259872" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="280" name="__module.encoder.layer.4.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="425,x.49"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="281" name="__module.encoder.layer.4.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="282" name="__module.encoder.layer.4.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="429,x.51"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="283" name="Constant_4453519" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="430"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="284" name="__module.encoder.layer.4.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="431"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="285" name="self.encoder.layer.4.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="182262944" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.4.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="286" name="__module.encoder.layer.4.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="287" name="Constant_4461775" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="184622240" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="288" name="__module.encoder.layer.4.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="434,x.53"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="289" name="__module.encoder.layer.4.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="290" name="__module.encoder.layer.4.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="438,x.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="291" name="Constant_4453542" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="439"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="292" name="__module.encoder.layer.4.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="440"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="293" name="self.encoder.layer.4.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="184625312" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.4.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="294" name="__module.encoder.layer.4.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="295" name="Constant_4461776" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="186984608" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="296" name="__module.encoder.layer.4.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="443,x.57"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="297" name="__module.encoder.layer.4.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="298" name="__module.encoder.layer.4.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="447,x.59"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="299" name="Constant_4453565" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="448"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="300" name="__module.encoder.layer.4.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="449"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="301" name="__module.encoder.layer.4.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="450,attn_output.17"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="302" name="__module.encoder.layer.4.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="303" name="__module.encoder.layer.4.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="451,attn_output.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="304" name="Constant_4461980" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="305" name="__module.encoder.layer.4.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="453"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="306" name="self.encoder.layer.4.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="186987680" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.4.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="307" name="__module.encoder.layer.4.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="308" name="Constant_4461777" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="189346976" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="309" name="__module.encoder.layer.4.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="459,input.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="310" name="__module.encoder.layer.4.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="461"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="311" name="__module.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="312" name="__module.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="313" name="Constant_4461778" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="189350048" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="314" name="__module.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="315" name="Constant_4461779" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="189353120" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="316" name="__module.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="465,input_tensor.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="317" name="self.encoder.layer.4.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="189356192" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.4.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="318" name="__module.encoder.layer.4.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="319" name="Constant_4461780" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="198793376" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="320" name="__module.encoder.layer.4.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="470"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="321" name="__module.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="471"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="322" name="self.encoder.layer.4.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="198805664" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.4.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="323" name="__module.encoder.layer.4.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="324" name="Constant_4461781" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="208242848" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="325" name="__module.encoder.layer.4.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="477,input.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="326" name="__module.encoder.layer.4.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="479"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="327" name="__module.encoder.layer.4.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="328" name="__module.encoder.layer.4.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="329" name="Constant_4461782" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="208245920" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="330" name="__module.encoder.layer.4.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="331" name="Constant_4461783" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="208248992" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="332" name="__module.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="483,hidden_states.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="333" name="self.encoder.layer.5.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="208252064" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.5.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="334" name="__module.encoder.layer.5.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="335" name="Constant_4461784" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="210611360" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="336" name="__module.encoder.layer.5.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="496,x.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="337" name="__module.encoder.layer.5.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="338" name="__module.encoder.layer.5.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="500,x.63"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="339" name="Constant_4453745" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="501"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="340" name="__module.encoder.layer.5.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="502"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="341" name="self.encoder.layer.5.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="210614432" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.5.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="342" name="__module.encoder.layer.5.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="343" name="Constant_4461785" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="212973728" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="344" name="__module.encoder.layer.5.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="505,x.65"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="345" name="__module.encoder.layer.5.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="346" name="__module.encoder.layer.5.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="509,x.67"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="347" name="Constant_4453768" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="510"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="348" name="__module.encoder.layer.5.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="511"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="349" name="self.encoder.layer.5.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="212976800" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.5.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="350" name="__module.encoder.layer.5.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="351" name="Constant_4461786" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="215336096" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="352" name="__module.encoder.layer.5.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="514,x.69"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="353" name="__module.encoder.layer.5.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="354" name="__module.encoder.layer.5.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="518,x.71"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="355" name="Constant_4453791" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="519"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="356" name="__module.encoder.layer.5.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="520"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="357" name="__module.encoder.layer.5.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="521,attn_output.21"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="358" name="__module.encoder.layer.5.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="359" name="__module.encoder.layer.5.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="522,attn_output.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="360" name="Constant_4461981" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="361" name="__module.encoder.layer.5.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="524"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="362" name="self.encoder.layer.5.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="215339168" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.5.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="363" name="__module.encoder.layer.5.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="364" name="Constant_4461787" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="217698464" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="365" name="__module.encoder.layer.5.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="530,input.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="366" name="__module.encoder.layer.5.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="532"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="367" name="__module.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="368" name="__module.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="369" name="Constant_4461788" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="217701536" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="370" name="__module.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="371" name="Constant_4461789" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="217704608" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="372" name="__module.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="536,input_tensor.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="373" name="self.encoder.layer.5.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="217707680" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.5.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="374" name="__module.encoder.layer.5.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="375" name="Constant_4461790" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="227144864" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="376" name="__module.encoder.layer.5.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="541"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="377" name="__module.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="542"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="378" name="self.encoder.layer.5.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="227157152" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.5.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="379" name="__module.encoder.layer.5.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="380" name="Constant_4461791" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="236594336" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="381" name="__module.encoder.layer.5.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="548,input.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="382" name="__module.encoder.layer.5.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="550"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="383" name="__module.encoder.layer.5.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="384" name="__module.encoder.layer.5.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="385" name="Constant_4461792" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="236597408" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="386" name="__module.encoder.layer.5.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="387" name="Constant_4461793" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="236600480" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="388" name="__module.encoder.layer.5.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="554,hidden_states.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="389" name="self.encoder.layer.6.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="236603552" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.6.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="390" name="__module.encoder.layer.6.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="391" name="Constant_4461794" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="238962848" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="392" name="__module.encoder.layer.6.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="567,x.73"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="393" name="__module.encoder.layer.6.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="394" name="__module.encoder.layer.6.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="571,x.75"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="395" name="Constant_4453971" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="572"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="396" name="__module.encoder.layer.6.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="573"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="397" name="self.encoder.layer.6.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="238965920" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.6.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="398" name="__module.encoder.layer.6.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="399" name="Constant_4461795" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="241325216" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="400" name="__module.encoder.layer.6.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="576,x.77"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="401" name="__module.encoder.layer.6.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="402" name="__module.encoder.layer.6.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="580,x.79"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="403" name="Constant_4453994" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="581"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="404" name="__module.encoder.layer.6.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="582"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="405" name="self.encoder.layer.6.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="241328288" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.6.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="406" name="__module.encoder.layer.6.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="407" name="Constant_4461796" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="243687584" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="408" name="__module.encoder.layer.6.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="585,x.81"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="409" name="__module.encoder.layer.6.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="410" name="__module.encoder.layer.6.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="589,x.83"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="411" name="Constant_4454017" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="590"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="412" name="__module.encoder.layer.6.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="591"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="413" name="__module.encoder.layer.6.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="592,attn_output.25"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="414" name="__module.encoder.layer.6.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="415" name="__module.encoder.layer.6.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="593,attn_output.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="416" name="Constant_4461982" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="417" name="__module.encoder.layer.6.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="595"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="418" name="self.encoder.layer.6.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="243690656" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.6.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="419" name="__module.encoder.layer.6.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="420" name="Constant_4461797" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="246049952" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="421" name="__module.encoder.layer.6.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="601,input.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="422" name="__module.encoder.layer.6.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="603"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="423" name="__module.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="424" name="__module.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="425" name="Constant_4461798" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="246053024" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="426" name="__module.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="427" name="Constant_4461799" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="246056096" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="428" name="__module.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="607,input_tensor.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="429" name="self.encoder.layer.6.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="246059168" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.6.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="430" name="__module.encoder.layer.6.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="431" name="Constant_4461800" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="255496352" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="432" name="__module.encoder.layer.6.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="612"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="433" name="__module.encoder.layer.6.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="613"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="434" name="self.encoder.layer.6.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="255508640" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.6.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="435" name="__module.encoder.layer.6.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="436" name="Constant_4461801" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="264945824" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="437" name="__module.encoder.layer.6.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="619,input.29"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="438" name="__module.encoder.layer.6.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="621"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="439" name="__module.encoder.layer.6.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="440" name="__module.encoder.layer.6.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="441" name="Constant_4461802" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="264948896" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="442" name="__module.encoder.layer.6.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="443" name="Constant_4461803" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="264951968" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="444" name="__module.encoder.layer.6.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="625,hidden_states.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="445" name="self.encoder.layer.7.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="264955040" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.7.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="446" name="__module.encoder.layer.7.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="447" name="Constant_4461804" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="267314336" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="448" name="__module.encoder.layer.7.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="638,x.85"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="449" name="__module.encoder.layer.7.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="450" name="__module.encoder.layer.7.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="642,x.87"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="451" name="Constant_4454197" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="643"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="452" name="__module.encoder.layer.7.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="644"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="453" name="self.encoder.layer.7.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="267317408" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.7.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="454" name="__module.encoder.layer.7.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="455" name="Constant_4461805" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="269676704" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="456" name="__module.encoder.layer.7.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="647,x.89"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="457" name="__module.encoder.layer.7.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="458" name="__module.encoder.layer.7.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="651,x.91"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="459" name="Constant_4454220" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="652"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="460" name="__module.encoder.layer.7.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="653"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="461" name="self.encoder.layer.7.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="269679776" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.7.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="462" name="__module.encoder.layer.7.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="463" name="Constant_4461806" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="272039072" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="464" name="__module.encoder.layer.7.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="656,x.93"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="465" name="__module.encoder.layer.7.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="466" name="__module.encoder.layer.7.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="660,x.95"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="467" name="Constant_4454243" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="661"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="468" name="__module.encoder.layer.7.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="662"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="469" name="__module.encoder.layer.7.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="663,attn_output.29"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="470" name="__module.encoder.layer.7.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="471" name="__module.encoder.layer.7.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="664,attn_output.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="472" name="Constant_4461983" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="473" name="__module.encoder.layer.7.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="666"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="474" name="self.encoder.layer.7.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="272042144" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.7.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="475" name="__module.encoder.layer.7.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="476" name="Constant_4461807" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="274401440" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="477" name="__module.encoder.layer.7.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="672,input.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="478" name="__module.encoder.layer.7.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="674"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="479" name="__module.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="480" name="__module.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="481" name="Constant_4461808" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="274404512" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="482" name="__module.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="483" name="Constant_4461809" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="274407584" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="484" name="__module.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="678,input_tensor.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="485" name="self.encoder.layer.7.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="274410656" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.7.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="486" name="__module.encoder.layer.7.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="487" name="Constant_4461810" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="283847840" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="488" name="__module.encoder.layer.7.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="683"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="489" name="__module.encoder.layer.7.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="684"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="490" name="self.encoder.layer.7.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="283860128" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.7.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="491" name="__module.encoder.layer.7.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="492" name="Constant_4461811" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="293297312" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="493" name="__module.encoder.layer.7.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="690,input.33"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="494" name="__module.encoder.layer.7.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="692"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="495" name="__module.encoder.layer.7.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="496" name="__module.encoder.layer.7.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="497" name="Constant_4461812" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="293300384" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="498" name="__module.encoder.layer.7.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="499" name="Constant_4461813" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="293303456" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="500" name="__module.encoder.layer.7.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="696,hidden_states.49"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="501" name="self.encoder.layer.8.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="293306528" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.8.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="502" name="__module.encoder.layer.8.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="503" name="Constant_4461814" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="295665824" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="504" name="__module.encoder.layer.8.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="709,x.97"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="505" name="__module.encoder.layer.8.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="506" name="__module.encoder.layer.8.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="713,x.99"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="507" name="Constant_4454423" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="714"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="508" name="__module.encoder.layer.8.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="715"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="509" name="self.encoder.layer.8.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="295668896" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.8.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="510" name="__module.encoder.layer.8.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="511" name="Constant_4461815" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="298028192" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="512" name="__module.encoder.layer.8.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="718,x.101"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="513" name="__module.encoder.layer.8.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="514" name="__module.encoder.layer.8.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="722,x.103"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="515" name="Constant_4454446" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="723"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="516" name="__module.encoder.layer.8.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="724"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="517" name="self.encoder.layer.8.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="298031264" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.8.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="518" name="__module.encoder.layer.8.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="519" name="Constant_4461816" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="300390560" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="520" name="__module.encoder.layer.8.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="727,x.105"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="521" name="__module.encoder.layer.8.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="522" name="__module.encoder.layer.8.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="731,x.107"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="523" name="Constant_4454469" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="732"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="524" name="__module.encoder.layer.8.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="733"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="525" name="__module.encoder.layer.8.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="734,attn_output.33"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="526" name="__module.encoder.layer.8.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="527" name="__module.encoder.layer.8.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="735,attn_output.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="528" name="Constant_4461984" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="529" name="__module.encoder.layer.8.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="737"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="530" name="self.encoder.layer.8.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="300393632" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.8.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="531" name="__module.encoder.layer.8.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="532" name="Constant_4461817" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="302752928" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="533" name="__module.encoder.layer.8.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="743,input.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="534" name="__module.encoder.layer.8.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="745"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="535" name="__module.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="536" name="__module.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="537" name="Constant_4461818" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="302756000" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="538" name="__module.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="539" name="Constant_4461819" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="302759072" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="540" name="__module.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="749,input_tensor.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="541" name="self.encoder.layer.8.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="302762144" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.8.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="542" name="__module.encoder.layer.8.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="543" name="Constant_4461820" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="312199328" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="544" name="__module.encoder.layer.8.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="754"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="545" name="__module.encoder.layer.8.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="755"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="546" name="self.encoder.layer.8.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="312211616" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.8.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="547" name="__module.encoder.layer.8.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="548" name="Constant_4461821" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="321648800" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="549" name="__module.encoder.layer.8.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="761,input.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="550" name="__module.encoder.layer.8.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="763"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="551" name="__module.encoder.layer.8.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="552" name="__module.encoder.layer.8.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="553" name="Constant_4461822" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="321651872" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="554" name="__module.encoder.layer.8.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="555" name="Constant_4461823" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="321654944" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="556" name="__module.encoder.layer.8.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="767,hidden_states.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="557" name="self.encoder.layer.9.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="321658016" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.9.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="558" name="__module.encoder.layer.9.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="559" name="Constant_4461824" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="324017312" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="560" name="__module.encoder.layer.9.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="780,x.109"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="561" name="__module.encoder.layer.9.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="562" name="__module.encoder.layer.9.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="784,x.111"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="563" name="Constant_4454649" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="785"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="564" name="__module.encoder.layer.9.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="786"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="565" name="self.encoder.layer.9.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="324020384" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.9.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="566" name="__module.encoder.layer.9.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="567" name="Constant_4461825" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="326379680" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="568" name="__module.encoder.layer.9.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="789,x.113"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="569" name="__module.encoder.layer.9.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="570" name="__module.encoder.layer.9.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="793,x.115"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="571" name="Constant_4454672" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="794"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="572" name="__module.encoder.layer.9.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="795"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="573" name="self.encoder.layer.9.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="326382752" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.9.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="574" name="__module.encoder.layer.9.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="575" name="Constant_4461826" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="328742048" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="576" name="__module.encoder.layer.9.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="798,x.117"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="577" name="__module.encoder.layer.9.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="578" name="__module.encoder.layer.9.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="802,x.119"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="579" name="Constant_4454695" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="803"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="580" name="__module.encoder.layer.9.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="804"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="581" name="__module.encoder.layer.9.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="805,attn_output.37"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="582" name="__module.encoder.layer.9.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="583" name="__module.encoder.layer.9.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="806,attn_output.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="584" name="Constant_4461985" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="585" name="__module.encoder.layer.9.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="808"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="586" name="self.encoder.layer.9.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="328745120" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.9.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="587" name="__module.encoder.layer.9.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="588" name="Constant_4461827" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="331104416" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="589" name="__module.encoder.layer.9.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="814,input.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="590" name="__module.encoder.layer.9.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="816"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="591" name="__module.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="592" name="__module.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="593" name="Constant_4461828" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="331107488" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="594" name="__module.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="595" name="Constant_4461829" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="331110560" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="596" name="__module.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="820,input_tensor.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="597" name="self.encoder.layer.9.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="331113632" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.9.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="598" name="__module.encoder.layer.9.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="599" name="Constant_4461830" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="340550816" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="600" name="__module.encoder.layer.9.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="825"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="601" name="__module.encoder.layer.9.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="826"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="602" name="self.encoder.layer.9.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="340563104" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.9.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="603" name="__module.encoder.layer.9.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="604" name="Constant_4461831" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="350000288" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="605" name="__module.encoder.layer.9.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="832,input.41"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="606" name="__module.encoder.layer.9.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="834"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="607" name="__module.encoder.layer.9.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="608" name="__module.encoder.layer.9.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="609" name="Constant_4461832" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="350003360" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="610" name="__module.encoder.layer.9.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="611" name="Constant_4461833" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="350006432" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="612" name="__module.encoder.layer.9.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="838,hidden_states.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="613" name="self.encoder.layer.10.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="350009504" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.10.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="614" name="__module.encoder.layer.10.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="615" name="Constant_4461834" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="352368800" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="616" name="__module.encoder.layer.10.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="851,x.121"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="617" name="__module.encoder.layer.10.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="618" name="__module.encoder.layer.10.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="855,x.123"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="619" name="Constant_4454875" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="856"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="620" name="__module.encoder.layer.10.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="857"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="621" name="self.encoder.layer.10.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="352371872" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.10.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="622" name="__module.encoder.layer.10.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="623" name="Constant_4461835" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="354731168" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="624" name="__module.encoder.layer.10.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="860,x.125"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="625" name="__module.encoder.layer.10.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="626" name="__module.encoder.layer.10.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="864,x.127"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="627" name="Constant_4454898" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="865"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="628" name="__module.encoder.layer.10.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="866"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="629" name="self.encoder.layer.10.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="354734240" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.10.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="630" name="__module.encoder.layer.10.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="631" name="Constant_4461836" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="357093536" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="632" name="__module.encoder.layer.10.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="869,x.129"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="633" name="__module.encoder.layer.10.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="634" name="__module.encoder.layer.10.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="873,x.131"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="635" name="Constant_4454921" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="874"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="636" name="__module.encoder.layer.10.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="875"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="637" name="__module.encoder.layer.10.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="876,attn_output.41"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="638" name="__module.encoder.layer.10.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="639" name="__module.encoder.layer.10.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="877,attn_output.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="640" name="Constant_4461986" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="641" name="__module.encoder.layer.10.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="879"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="642" name="self.encoder.layer.10.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="357096608" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.10.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="643" name="__module.encoder.layer.10.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="644" name="Constant_4461837" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="359455904" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="645" name="__module.encoder.layer.10.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="885,input.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="646" name="__module.encoder.layer.10.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="887"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="647" name="__module.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="648" name="__module.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="649" name="Constant_4461838" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="359458976" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="650" name="__module.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="651" name="Constant_4461839" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="359462048" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="652" name="__module.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="891,input_tensor.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="653" name="self.encoder.layer.10.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="359465120" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.10.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="654" name="__module.encoder.layer.10.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="655" name="Constant_4461840" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="368902304" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="656" name="__module.encoder.layer.10.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="896"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="657" name="__module.encoder.layer.10.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="897"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="658" name="self.encoder.layer.10.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="368914592" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.10.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="659" name="__module.encoder.layer.10.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="660" name="Constant_4461841" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="378351776" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="661" name="__module.encoder.layer.10.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="903,input.45"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="662" name="__module.encoder.layer.10.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="905"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="663" name="__module.encoder.layer.10.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="664" name="__module.encoder.layer.10.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="665" name="Constant_4461842" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="378354848" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="666" name="__module.encoder.layer.10.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="667" name="Constant_4461843" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="378357920" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="668" name="__module.encoder.layer.10.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="909,hidden_states.67"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="669" name="self.encoder.layer.11.attention.self.query.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="378360992" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.11.attention.self.query.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="670" name="__module.encoder.layer.11.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="671" name="Constant_4461844" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="380720288" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="672" name="__module.encoder.layer.11.attention.self.query/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="922,x.133"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="673" name="__module.encoder.layer.11.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="674" name="__module.encoder.layer.11.attention.self/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="926,x.135"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="675" name="Constant_4455101" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="927"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="676" name="__module.encoder.layer.11.attention.self/aten::permute/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="928"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="677" name="self.encoder.layer.11.attention.self.key.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="380723360" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.11.attention.self.key.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="678" name="__module.encoder.layer.11.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="679" name="Constant_4461845" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="383082656" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="680" name="__module.encoder.layer.11.attention.self.key/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="931,x.137"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="681" name="__module.encoder.layer.11.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="682" name="__module.encoder.layer.11.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="935,x.139"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="683" name="Constant_4455124" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="936"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="684" name="__module.encoder.layer.11.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="937"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="685" name="self.encoder.layer.11.attention.self.value.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="383085728" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.11.attention.self.value.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="686" name="__module.encoder.layer.11.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="687" name="Constant_4461846" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="385445024" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="688" name="__module.encoder.layer.11.attention.self.value/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="940,x.141"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="689" name="__module.encoder.layer.11.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856856" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="690" name="__module.encoder.layer.11.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="944,x"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="691" name="Constant_4455147" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="68856888" size="32" /> + <output> + <port id="0" precision="I64" names="945"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="692" name="__module.encoder.layer.11.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="946"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="693" name="__module.encoder.layer.11.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="947,attn_output.45"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="694" name="__module.encoder.layer.11.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="73581688" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="695" name="__module.encoder.layer.11.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>12</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="948,attn_output"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="696" name="Constant_4461987" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="73581704" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="697" name="__module.encoder.layer.11.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>12</dim> + <dim>64</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="950"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="698" name="self.encoder.layer.11.attention.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 768" offset="385448096" size="2359296" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.11.attention.output.dense.weight"> + <dim>768</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="699" name="__module.encoder.layer.11.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="700" name="Constant_4461847" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="387807392" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="701" name="__module.encoder.layer.11.attention.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="956,input.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="702" name="__module.encoder.layer.11.attention.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="958"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="703" name="__module.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="704" name="__module.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="705" name="Constant_4461848" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="387810464" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="706" name="__module.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="707" name="Constant_4461849" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="387813536" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="708" name="__module.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="962,input_tensor"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="709" name="self.encoder.layer.11.intermediate.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="3072, 768" offset="387816608" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.11.intermediate.dense.weight"> + <dim>3072</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="710" name="__module.encoder.layer.11.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>3072</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="711" name="Constant_4461850" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 3072" offset="397253792" size="12288" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="712" name="__module.encoder.layer.11.intermediate.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="967"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="713" name="__module.encoder.layer.11.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> + <data approximation_mode="ERF" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="968"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="714" name="self.encoder.layer.11.output.dense.weight" type="Const" version="opset1"> + <data element_type="f32" shape="768, 3072" offset="397266080" size="9437184" /> + <output> + <port id="0" precision="FP32" names="self.encoder.layer.11.output.dense.weight"> + <dim>768</dim> + <dim>3072</dim> + </port> + </output> + </layer> + <layer id="715" name="__module.encoder.layer.11.output.dense/aten::linear/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>3072</dim> + </port> + <port id="1" precision="FP32"> + <dim>768</dim> + <dim>3072</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="716" name="Constant_4461851" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="406703264" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="717" name="__module.encoder.layer.11.output.dense/aten::linear/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="974,input"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="718" name="__module.encoder.layer.11.output/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="976"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="719" name="__module.encoder.layer.11.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1"> + <data element_type="i32" shape="1" offset="66488340" size="4" /> + <output> + <port id="0" precision="I32"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="720" name="__module.encoder.layer.11.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6"> + <data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="I32"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="721" name="Constant_4461852" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="406706336" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="722" name="__module.encoder.layer.11.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="723" name="Constant_4461853" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 768" offset="406709408" size="3072" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="724" name="__module.encoder.layer.11.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>768</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="last_hidden_state"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </output> + </layer> + <layer id="725" name="Result_4457039" type="Result" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>768</dim> + </port> + </input> + </layer> + </layers> + <edges> + <edge from-layer="0" from-port="0" to-layer="8" to-port="0" /> + <edge from-layer="1" from-port="0" to-layer="58" to-port="0" /> + <edge from-layer="2" from-port="0" to-layer="15" to-port="0" /> + <edge from-layer="2" from-port="0" to-layer="4" to-port="0" /> + <edge from-layer="3" from-port="0" to-layer="6" to-port="0" /> + <edge from-layer="4" from-port="1" to-layer="6" to-port="1" /> + <edge from-layer="5" from-port="0" to-layer="6" to-port="2" /> + <edge from-layer="6" from-port="3" to-layer="11" to-port="0" /> + <edge from-layer="7" from-port="0" to-layer="10" to-port="0" /> + <edge from-layer="8" from-port="1" to-layer="10" to-port="1" /> + <edge from-layer="9" from-port="0" to-layer="10" to-port="2" /> + <edge from-layer="10" from-port="3" to-layer="11" to-port="1" /> + <edge from-layer="11" from-port="2" to-layer="25" to-port="0" /> + <edge from-layer="12" from-port="0" to-layer="24" to-port="0" /> + <edge from-layer="13" from-port="0" to-layer="21" to-port="0" /> + <edge from-layer="14" from-port="0" to-layer="21" to-port="1" /> + <edge from-layer="15" from-port="1" to-layer="63" to-port="0" /> + <edge from-layer="15" from-port="1" to-layer="67" to-port="0" /> + <edge from-layer="15" from-port="1" to-layer="18" to-port="0" /> + <edge from-layer="16" from-port="0" to-layer="18" to-port="1" /> + <edge from-layer="17" from-port="0" to-layer="18" to-port="2" /> + <edge from-layer="18" from-port="3" to-layer="21" to-port="2" /> + <edge from-layer="19" from-port="0" to-layer="21" to-port="3" /> + <edge from-layer="20" from-port="0" to-layer="21" to-port="4" /> + <edge from-layer="21" from-port="5" to-layer="22" to-port="0" /> + <edge from-layer="22" from-port="1" to-layer="24" to-port="1" /> + <edge from-layer="23" from-port="0" to-layer="24" to-port="2" /> + <edge from-layer="24" from-port="3" to-layer="25" to-port="1" /> + <edge from-layer="25" from-port="2" to-layer="27" to-port="0" /> + <edge from-layer="26" from-port="0" to-layer="27" to-port="1" /> + <edge from-layer="27" from-port="2" to-layer="29" to-port="0" /> + <edge from-layer="28" from-port="0" to-layer="29" to-port="1" /> + <edge from-layer="29" from-port="2" to-layer="31" to-port="0" /> + <edge from-layer="30" from-port="0" to-layer="31" to-port="1" /> + <edge from-layer="31" from-port="2" to-layer="86" to-port="1" /> + <edge from-layer="31" from-port="2" to-layer="49" to-port="0" /> + <edge from-layer="31" from-port="2" to-layer="41" to-port="0" /> + <edge from-layer="31" from-port="2" to-layer="33" to-port="0" /> + <edge from-layer="32" from-port="0" to-layer="33" to-port="1" /> + <edge from-layer="33" from-port="2" to-layer="35" to-port="0" /> + <edge from-layer="34" from-port="0" to-layer="35" to-port="1" /> + <edge from-layer="35" from-port="2" to-layer="37" to-port="0" /> + <edge from-layer="36" from-port="0" to-layer="37" to-port="1" /> + <edge from-layer="37" from-port="2" to-layer="39" to-port="0" /> + <edge from-layer="38" from-port="0" to-layer="39" to-port="1" /> + <edge from-layer="39" from-port="2" to-layer="77" to-port="0" /> + <edge from-layer="40" from-port="0" to-layer="41" to-port="1" /> + <edge from-layer="41" from-port="2" to-layer="43" to-port="0" /> + <edge from-layer="42" from-port="0" to-layer="43" to-port="1" /> + <edge from-layer="43" from-port="2" to-layer="45" to-port="0" /> + <edge from-layer="44" from-port="0" to-layer="45" to-port="1" /> + <edge from-layer="45" from-port="2" to-layer="47" to-port="0" /> + <edge from-layer="46" from-port="0" to-layer="47" to-port="1" /> + <edge from-layer="47" from-port="2" to-layer="77" to-port="1" /> + <edge from-layer="48" from-port="0" to-layer="49" to-port="1" /> + <edge from-layer="49" from-port="2" to-layer="51" to-port="0" /> + <edge from-layer="50" from-port="0" to-layer="51" to-port="1" /> + <edge from-layer="51" from-port="2" to-layer="53" to-port="0" /> + <edge from-layer="52" from-port="0" to-layer="53" to-port="1" /> + <edge from-layer="53" from-port="2" to-layer="55" to-port="0" /> + <edge from-layer="54" from-port="0" to-layer="55" to-port="1" /> + <edge from-layer="55" from-port="2" to-layer="77" to-port="2" /> + <edge from-layer="56" from-port="0" to-layer="73" to-port="0" /> + <edge from-layer="57" from-port="0" to-layer="58" to-port="1" /> + <edge from-layer="58" from-port="2" to-layer="60" to-port="0" /> + <edge from-layer="59" from-port="0" to-layer="60" to-port="1" /> + <edge from-layer="60" from-port="2" to-layer="69" to-port="0" /> + <edge from-layer="61" from-port="0" to-layer="63" to-port="1" /> + <edge from-layer="62" from-port="0" to-layer="63" to-port="2" /> + <edge from-layer="63" from-port="3" to-layer="68" to-port="0" /> + <edge from-layer="64" from-port="0" to-layer="68" to-port="1" /> + <edge from-layer="65" from-port="0" to-layer="67" to-port="1" /> + <edge from-layer="66" from-port="0" to-layer="67" to-port="2" /> + <edge from-layer="67" from-port="3" to-layer="68" to-port="2" /> + <edge from-layer="68" from-port="3" to-layer="69" to-port="1" /> + <edge from-layer="69" from-port="2" to-layer="70" to-port="0" /> + <edge from-layer="70" from-port="1" to-layer="72" to-port="0" /> + <edge from-layer="71" from-port="0" to-layer="72" to-port="1" /> + <edge from-layer="72" from-port="2" to-layer="73" to-port="1" /> + <edge from-layer="73" from-port="2" to-layer="74" to-port="0" /> + <edge from-layer="73" from-port="2" to-layer="76" to-port="2" /> + <edge from-layer="74" from-port="1" to-layer="76" to-port="0" /> + <edge from-layer="75" from-port="0" to-layer="76" to-port="1" /> + <edge from-layer="76" from-port="3" to-layer="133" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="413" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="189" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="245" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="301" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="357" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="693" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="637" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="581" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="525" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="469" to-port="3" /> + <edge from-layer="76" from-port="3" to-layer="77" to-port="3" /> + <edge from-layer="77" from-port="4" to-layer="79" to-port="0" /> + <edge from-layer="78" from-port="0" to-layer="79" to-port="1" /> + <edge from-layer="79" from-port="2" to-layer="81" to-port="0" /> + <edge from-layer="80" from-port="0" to-layer="81" to-port="1" /> + <edge from-layer="81" from-port="2" to-layer="83" to-port="0" /> + <edge from-layer="82" from-port="0" to-layer="83" to-port="1" /> + <edge from-layer="83" from-port="2" to-layer="85" to-port="0" /> + <edge from-layer="84" from-port="0" to-layer="85" to-port="1" /> + <edge from-layer="85" from-port="2" to-layer="86" to-port="0" /> + <edge from-layer="86" from-port="2" to-layer="88" to-port="0" /> + <edge from-layer="87" from-port="0" to-layer="88" to-port="1" /> + <edge from-layer="88" from-port="2" to-layer="90" to-port="0" /> + <edge from-layer="89" from-port="0" to-layer="90" to-port="1" /> + <edge from-layer="90" from-port="2" to-layer="92" to-port="0" /> + <edge from-layer="91" from-port="0" to-layer="92" to-port="1" /> + <edge from-layer="92" from-port="2" to-layer="102" to-port="1" /> + <edge from-layer="92" from-port="2" to-layer="94" to-port="0" /> + <edge from-layer="93" from-port="0" to-layer="94" to-port="1" /> + <edge from-layer="94" from-port="2" to-layer="96" to-port="0" /> + <edge from-layer="95" from-port="0" to-layer="96" to-port="1" /> + <edge from-layer="96" from-port="2" to-layer="97" to-port="0" /> + <edge from-layer="97" from-port="1" to-layer="99" to-port="0" /> + <edge from-layer="98" from-port="0" to-layer="99" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="101" to-port="0" /> + <edge from-layer="100" from-port="0" to-layer="101" to-port="1" /> + <edge from-layer="101" from-port="2" to-layer="102" to-port="0" /> + <edge from-layer="102" from-port="2" to-layer="104" to-port="0" /> + <edge from-layer="103" from-port="0" to-layer="104" to-port="1" /> + <edge from-layer="104" from-port="2" to-layer="106" to-port="0" /> + <edge from-layer="105" from-port="0" to-layer="106" to-port="1" /> + <edge from-layer="106" from-port="2" to-layer="108" to-port="0" /> + <edge from-layer="107" from-port="0" to-layer="108" to-port="1" /> + <edge from-layer="108" from-port="2" to-layer="118" to-port="0" /> + <edge from-layer="108" from-port="2" to-layer="110" to-port="0" /> + <edge from-layer="108" from-port="2" to-layer="126" to-port="0" /> + <edge from-layer="108" from-port="2" to-layer="142" to-port="1" /> + <edge from-layer="109" from-port="0" to-layer="110" to-port="1" /> + <edge from-layer="110" from-port="2" to-layer="112" to-port="0" /> + <edge from-layer="111" from-port="0" to-layer="112" to-port="1" /> + <edge from-layer="112" from-port="2" to-layer="114" to-port="0" /> + <edge from-layer="113" from-port="0" to-layer="114" to-port="1" /> + <edge from-layer="114" from-port="2" to-layer="116" to-port="0" /> + <edge from-layer="115" from-port="0" to-layer="116" to-port="1" /> + <edge from-layer="116" from-port="2" to-layer="133" to-port="0" /> + <edge from-layer="117" from-port="0" to-layer="118" to-port="1" /> + <edge from-layer="118" from-port="2" to-layer="120" to-port="0" /> + <edge from-layer="119" from-port="0" to-layer="120" to-port="1" /> + <edge from-layer="120" from-port="2" to-layer="122" to-port="0" /> + <edge from-layer="121" from-port="0" to-layer="122" to-port="1" /> + <edge from-layer="122" from-port="2" to-layer="124" to-port="0" /> + <edge from-layer="123" from-port="0" to-layer="124" to-port="1" /> + <edge from-layer="124" from-port="2" to-layer="133" to-port="1" /> + <edge from-layer="125" from-port="0" to-layer="126" to-port="1" /> + <edge from-layer="126" from-port="2" to-layer="128" to-port="0" /> + <edge from-layer="127" from-port="0" to-layer="128" to-port="1" /> + <edge from-layer="128" from-port="2" to-layer="130" to-port="0" /> + <edge from-layer="129" from-port="0" to-layer="130" to-port="1" /> + <edge from-layer="130" from-port="2" to-layer="132" to-port="0" /> + <edge from-layer="131" from-port="0" to-layer="132" to-port="1" /> + <edge from-layer="132" from-port="2" to-layer="133" to-port="2" /> + <edge from-layer="133" from-port="4" to-layer="135" to-port="0" /> + <edge from-layer="134" from-port="0" to-layer="135" to-port="1" /> + <edge from-layer="135" from-port="2" to-layer="137" to-port="0" /> + <edge from-layer="136" from-port="0" to-layer="137" to-port="1" /> + <edge from-layer="137" from-port="2" to-layer="139" to-port="0" /> + <edge from-layer="138" from-port="0" to-layer="139" to-port="1" /> + <edge from-layer="139" from-port="2" to-layer="141" to-port="0" /> + <edge from-layer="140" from-port="0" to-layer="141" to-port="1" /> + <edge from-layer="141" from-port="2" to-layer="142" to-port="0" /> + <edge from-layer="142" from-port="2" to-layer="144" to-port="0" /> + <edge from-layer="143" from-port="0" to-layer="144" to-port="1" /> + <edge from-layer="144" from-port="2" to-layer="146" to-port="0" /> + <edge from-layer="145" from-port="0" to-layer="146" to-port="1" /> + <edge from-layer="146" from-port="2" to-layer="148" to-port="0" /> + <edge from-layer="147" from-port="0" to-layer="148" to-port="1" /> + <edge from-layer="148" from-port="2" to-layer="158" to-port="1" /> + <edge from-layer="148" from-port="2" to-layer="150" to-port="0" /> + <edge from-layer="149" from-port="0" to-layer="150" to-port="1" /> + <edge from-layer="150" from-port="2" to-layer="152" to-port="0" /> + <edge from-layer="151" from-port="0" to-layer="152" to-port="1" /> + <edge from-layer="152" from-port="2" to-layer="153" to-port="0" /> + <edge from-layer="153" from-port="1" to-layer="155" to-port="0" /> + <edge from-layer="154" from-port="0" to-layer="155" to-port="1" /> + <edge from-layer="155" from-port="2" to-layer="157" to-port="0" /> + <edge from-layer="156" from-port="0" to-layer="157" to-port="1" /> + <edge from-layer="157" from-port="2" to-layer="158" to-port="0" /> + <edge from-layer="158" from-port="2" to-layer="160" to-port="0" /> + <edge from-layer="159" from-port="0" to-layer="160" to-port="1" /> + <edge from-layer="160" from-port="2" to-layer="162" to-port="0" /> + <edge from-layer="161" from-port="0" to-layer="162" to-port="1" /> + <edge from-layer="162" from-port="2" to-layer="164" to-port="0" /> + <edge from-layer="163" from-port="0" to-layer="164" to-port="1" /> + <edge from-layer="164" from-port="2" to-layer="198" to-port="1" /> + <edge from-layer="164" from-port="2" to-layer="166" to-port="0" /> + <edge from-layer="164" from-port="2" to-layer="182" to-port="0" /> + <edge from-layer="164" from-port="2" to-layer="174" to-port="0" /> + <edge from-layer="165" from-port="0" to-layer="166" to-port="1" /> + <edge from-layer="166" from-port="2" to-layer="168" to-port="0" /> + <edge from-layer="167" from-port="0" to-layer="168" to-port="1" /> + <edge from-layer="168" from-port="2" to-layer="170" to-port="0" /> + <edge from-layer="169" from-port="0" to-layer="170" to-port="1" /> + <edge from-layer="170" from-port="2" to-layer="172" to-port="0" /> + <edge from-layer="171" from-port="0" to-layer="172" to-port="1" /> + <edge from-layer="172" from-port="2" to-layer="189" to-port="0" /> + <edge from-layer="173" from-port="0" to-layer="174" to-port="1" /> + <edge from-layer="174" from-port="2" to-layer="176" to-port="0" /> + <edge from-layer="175" from-port="0" to-layer="176" to-port="1" /> + <edge from-layer="176" from-port="2" to-layer="178" to-port="0" /> + <edge from-layer="177" from-port="0" to-layer="178" to-port="1" /> + <edge from-layer="178" from-port="2" to-layer="180" to-port="0" /> + <edge from-layer="179" from-port="0" to-layer="180" to-port="1" /> + <edge from-layer="180" from-port="2" to-layer="189" to-port="1" /> + <edge from-layer="181" from-port="0" to-layer="182" to-port="1" /> + <edge from-layer="182" from-port="2" to-layer="184" to-port="0" /> + <edge from-layer="183" from-port="0" to-layer="184" to-port="1" /> + <edge from-layer="184" from-port="2" to-layer="186" to-port="0" /> + <edge from-layer="185" from-port="0" to-layer="186" to-port="1" /> + <edge from-layer="186" from-port="2" to-layer="188" to-port="0" /> + <edge from-layer="187" from-port="0" to-layer="188" to-port="1" /> + <edge from-layer="188" from-port="2" to-layer="189" to-port="2" /> + <edge from-layer="189" from-port="4" to-layer="191" to-port="0" /> + <edge from-layer="190" from-port="0" to-layer="191" to-port="1" /> + <edge from-layer="191" from-port="2" to-layer="193" to-port="0" /> + <edge from-layer="192" from-port="0" to-layer="193" to-port="1" /> + <edge from-layer="193" from-port="2" to-layer="195" to-port="0" /> + <edge from-layer="194" from-port="0" to-layer="195" to-port="1" /> + <edge from-layer="195" from-port="2" to-layer="197" to-port="0" /> + <edge from-layer="196" from-port="0" to-layer="197" to-port="1" /> + <edge from-layer="197" from-port="2" to-layer="198" to-port="0" /> + <edge from-layer="198" from-port="2" to-layer="200" to-port="0" /> + <edge from-layer="199" from-port="0" to-layer="200" to-port="1" /> + <edge from-layer="200" from-port="2" to-layer="202" to-port="0" /> + <edge from-layer="201" from-port="0" to-layer="202" to-port="1" /> + <edge from-layer="202" from-port="2" to-layer="204" to-port="0" /> + <edge from-layer="203" from-port="0" to-layer="204" to-port="1" /> + <edge from-layer="204" from-port="2" to-layer="214" to-port="1" /> + <edge from-layer="204" from-port="2" to-layer="206" to-port="0" /> + <edge from-layer="205" from-port="0" to-layer="206" to-port="1" /> + <edge from-layer="206" from-port="2" to-layer="208" to-port="0" /> + <edge from-layer="207" from-port="0" to-layer="208" to-port="1" /> + <edge from-layer="208" from-port="2" to-layer="209" to-port="0" /> + <edge from-layer="209" from-port="1" to-layer="211" to-port="0" /> + <edge from-layer="210" from-port="0" to-layer="211" to-port="1" /> + <edge from-layer="211" from-port="2" to-layer="213" to-port="0" /> + <edge from-layer="212" from-port="0" to-layer="213" to-port="1" /> + <edge from-layer="213" from-port="2" to-layer="214" to-port="0" /> + <edge from-layer="214" from-port="2" to-layer="216" to-port="0" /> + <edge from-layer="215" from-port="0" to-layer="216" to-port="1" /> + <edge from-layer="216" from-port="2" to-layer="218" to-port="0" /> + <edge from-layer="217" from-port="0" to-layer="218" to-port="1" /> + <edge from-layer="218" from-port="2" to-layer="220" to-port="0" /> + <edge from-layer="219" from-port="0" to-layer="220" to-port="1" /> + <edge from-layer="220" from-port="2" to-layer="230" to-port="0" /> + <edge from-layer="220" from-port="2" to-layer="238" to-port="0" /> + <edge from-layer="220" from-port="2" to-layer="222" to-port="0" /> + <edge from-layer="220" from-port="2" to-layer="254" to-port="1" /> + <edge from-layer="221" from-port="0" to-layer="222" to-port="1" /> + <edge from-layer="222" from-port="2" to-layer="224" to-port="0" /> + <edge from-layer="223" from-port="0" to-layer="224" to-port="1" /> + <edge from-layer="224" from-port="2" to-layer="226" to-port="0" /> + <edge from-layer="225" from-port="0" to-layer="226" to-port="1" /> + <edge from-layer="226" from-port="2" to-layer="228" to-port="0" /> + <edge from-layer="227" from-port="0" to-layer="228" to-port="1" /> + <edge from-layer="228" from-port="2" to-layer="245" to-port="0" /> + <edge from-layer="229" from-port="0" to-layer="230" to-port="1" /> + <edge from-layer="230" from-port="2" to-layer="232" to-port="0" /> + <edge from-layer="231" from-port="0" to-layer="232" to-port="1" /> + <edge from-layer="232" from-port="2" to-layer="234" to-port="0" /> + <edge from-layer="233" from-port="0" to-layer="234" to-port="1" /> + <edge from-layer="234" from-port="2" to-layer="236" to-port="0" /> + <edge from-layer="235" from-port="0" to-layer="236" to-port="1" /> + <edge from-layer="236" from-port="2" to-layer="245" to-port="1" /> + <edge from-layer="237" from-port="0" to-layer="238" to-port="1" /> + <edge from-layer="238" from-port="2" to-layer="240" to-port="0" /> + <edge from-layer="239" from-port="0" to-layer="240" to-port="1" /> + <edge from-layer="240" from-port="2" to-layer="242" to-port="0" /> + <edge from-layer="241" from-port="0" to-layer="242" to-port="1" /> + <edge from-layer="242" from-port="2" to-layer="244" to-port="0" /> + <edge from-layer="243" from-port="0" to-layer="244" to-port="1" /> + <edge from-layer="244" from-port="2" to-layer="245" to-port="2" /> + <edge from-layer="245" from-port="4" to-layer="247" to-port="0" /> + <edge from-layer="246" from-port="0" to-layer="247" to-port="1" /> + <edge from-layer="247" from-port="2" to-layer="249" to-port="0" /> + <edge from-layer="248" from-port="0" to-layer="249" to-port="1" /> + <edge from-layer="249" from-port="2" to-layer="251" to-port="0" /> + <edge from-layer="250" from-port="0" to-layer="251" to-port="1" /> + <edge from-layer="251" from-port="2" to-layer="253" to-port="0" /> + <edge from-layer="252" from-port="0" to-layer="253" to-port="1" /> + <edge from-layer="253" from-port="2" to-layer="254" to-port="0" /> + <edge from-layer="254" from-port="2" to-layer="256" to-port="0" /> + <edge from-layer="255" from-port="0" to-layer="256" to-port="1" /> + <edge from-layer="256" from-port="2" to-layer="258" to-port="0" /> + <edge from-layer="257" from-port="0" to-layer="258" to-port="1" /> + <edge from-layer="258" from-port="2" to-layer="260" to-port="0" /> + <edge from-layer="259" from-port="0" to-layer="260" to-port="1" /> + <edge from-layer="260" from-port="2" to-layer="262" to-port="0" /> + <edge from-layer="260" from-port="2" to-layer="270" to-port="1" /> + <edge from-layer="261" from-port="0" to-layer="262" to-port="1" /> + <edge from-layer="262" from-port="2" to-layer="264" to-port="0" /> + <edge from-layer="263" from-port="0" to-layer="264" to-port="1" /> + <edge from-layer="264" from-port="2" to-layer="265" to-port="0" /> + <edge from-layer="265" from-port="1" to-layer="267" to-port="0" /> + <edge from-layer="266" from-port="0" to-layer="267" to-port="1" /> + <edge from-layer="267" from-port="2" to-layer="269" to-port="0" /> + <edge from-layer="268" from-port="0" to-layer="269" to-port="1" /> + <edge from-layer="269" from-port="2" to-layer="270" to-port="0" /> + <edge from-layer="270" from-port="2" to-layer="272" to-port="0" /> + <edge from-layer="271" from-port="0" to-layer="272" to-port="1" /> + <edge from-layer="272" from-port="2" to-layer="274" to-port="0" /> + <edge from-layer="273" from-port="0" to-layer="274" to-port="1" /> + <edge from-layer="274" from-port="2" to-layer="276" to-port="0" /> + <edge from-layer="275" from-port="0" to-layer="276" to-port="1" /> + <edge from-layer="276" from-port="2" to-layer="294" to-port="0" /> + <edge from-layer="276" from-port="2" to-layer="286" to-port="0" /> + <edge from-layer="276" from-port="2" to-layer="278" to-port="0" /> + <edge from-layer="276" from-port="2" to-layer="310" to-port="1" /> + <edge from-layer="277" from-port="0" to-layer="278" to-port="1" /> + <edge from-layer="278" from-port="2" to-layer="280" to-port="0" /> + <edge from-layer="279" from-port="0" to-layer="280" to-port="1" /> + <edge from-layer="280" from-port="2" to-layer="282" to-port="0" /> + <edge from-layer="281" from-port="0" to-layer="282" to-port="1" /> + <edge from-layer="282" from-port="2" to-layer="284" to-port="0" /> + <edge from-layer="283" from-port="0" to-layer="284" to-port="1" /> + <edge from-layer="284" from-port="2" to-layer="301" to-port="0" /> + <edge from-layer="285" from-port="0" to-layer="286" to-port="1" /> + <edge from-layer="286" from-port="2" to-layer="288" to-port="0" /> + <edge from-layer="287" from-port="0" to-layer="288" to-port="1" /> + <edge from-layer="288" from-port="2" to-layer="290" to-port="0" /> + <edge from-layer="289" from-port="0" to-layer="290" to-port="1" /> + <edge from-layer="290" from-port="2" to-layer="292" to-port="0" /> + <edge from-layer="291" from-port="0" to-layer="292" to-port="1" /> + <edge from-layer="292" from-port="2" to-layer="301" to-port="1" /> + <edge from-layer="293" from-port="0" to-layer="294" to-port="1" /> + <edge from-layer="294" from-port="2" to-layer="296" to-port="0" /> + <edge from-layer="295" from-port="0" to-layer="296" to-port="1" /> + <edge from-layer="296" from-port="2" to-layer="298" to-port="0" /> + <edge from-layer="297" from-port="0" to-layer="298" to-port="1" /> + <edge from-layer="298" from-port="2" to-layer="300" to-port="0" /> + <edge from-layer="299" from-port="0" to-layer="300" to-port="1" /> + <edge from-layer="300" from-port="2" to-layer="301" to-port="2" /> + <edge from-layer="301" from-port="4" to-layer="303" to-port="0" /> + <edge from-layer="302" from-port="0" to-layer="303" to-port="1" /> + <edge from-layer="303" from-port="2" to-layer="305" to-port="0" /> + <edge from-layer="304" from-port="0" to-layer="305" to-port="1" /> + <edge from-layer="305" from-port="2" to-layer="307" to-port="0" /> + <edge from-layer="306" from-port="0" to-layer="307" to-port="1" /> + <edge from-layer="307" from-port="2" to-layer="309" to-port="0" /> + <edge from-layer="308" from-port="0" to-layer="309" to-port="1" /> + <edge from-layer="309" from-port="2" to-layer="310" to-port="0" /> + <edge from-layer="310" from-port="2" to-layer="312" to-port="0" /> + <edge from-layer="311" from-port="0" to-layer="312" to-port="1" /> + <edge from-layer="312" from-port="2" to-layer="314" to-port="0" /> + <edge from-layer="313" from-port="0" to-layer="314" to-port="1" /> + <edge from-layer="314" from-port="2" to-layer="316" to-port="0" /> + <edge from-layer="315" from-port="0" to-layer="316" to-port="1" /> + <edge from-layer="316" from-port="2" to-layer="318" to-port="0" /> + <edge from-layer="316" from-port="2" to-layer="326" to-port="1" /> + <edge from-layer="317" from-port="0" to-layer="318" to-port="1" /> + <edge from-layer="318" from-port="2" to-layer="320" to-port="0" /> + <edge from-layer="319" from-port="0" to-layer="320" to-port="1" /> + <edge from-layer="320" from-port="2" to-layer="321" to-port="0" /> + <edge from-layer="321" from-port="1" to-layer="323" to-port="0" /> + <edge from-layer="322" from-port="0" to-layer="323" to-port="1" /> + <edge from-layer="323" from-port="2" to-layer="325" to-port="0" /> + <edge from-layer="324" from-port="0" to-layer="325" to-port="1" /> + <edge from-layer="325" from-port="2" to-layer="326" to-port="0" /> + <edge from-layer="326" from-port="2" to-layer="328" to-port="0" /> + <edge from-layer="327" from-port="0" to-layer="328" to-port="1" /> + <edge from-layer="328" from-port="2" to-layer="330" to-port="0" /> + <edge from-layer="329" from-port="0" to-layer="330" to-port="1" /> + <edge from-layer="330" from-port="2" to-layer="332" to-port="0" /> + <edge from-layer="331" from-port="0" to-layer="332" to-port="1" /> + <edge from-layer="332" from-port="2" to-layer="334" to-port="0" /> + <edge from-layer="332" from-port="2" to-layer="342" to-port="0" /> + <edge from-layer="332" from-port="2" to-layer="366" to-port="1" /> + <edge from-layer="332" from-port="2" to-layer="350" to-port="0" /> + <edge from-layer="333" from-port="0" to-layer="334" to-port="1" /> + <edge from-layer="334" from-port="2" to-layer="336" to-port="0" /> + <edge from-layer="335" from-port="0" to-layer="336" to-port="1" /> + <edge from-layer="336" from-port="2" to-layer="338" to-port="0" /> + <edge from-layer="337" from-port="0" to-layer="338" to-port="1" /> + <edge from-layer="338" from-port="2" to-layer="340" to-port="0" /> + <edge from-layer="339" from-port="0" to-layer="340" to-port="1" /> + <edge from-layer="340" from-port="2" to-layer="357" to-port="0" /> + <edge from-layer="341" from-port="0" to-layer="342" to-port="1" /> + <edge from-layer="342" from-port="2" to-layer="344" to-port="0" /> + <edge from-layer="343" from-port="0" to-layer="344" to-port="1" /> + <edge from-layer="344" from-port="2" to-layer="346" to-port="0" /> + <edge from-layer="345" from-port="0" to-layer="346" to-port="1" /> + <edge from-layer="346" from-port="2" to-layer="348" to-port="0" /> + <edge from-layer="347" from-port="0" to-layer="348" to-port="1" /> + <edge from-layer="348" from-port="2" to-layer="357" to-port="1" /> + <edge from-layer="349" from-port="0" to-layer="350" to-port="1" /> + <edge from-layer="350" from-port="2" to-layer="352" to-port="0" /> + <edge from-layer="351" from-port="0" to-layer="352" to-port="1" /> + <edge from-layer="352" from-port="2" to-layer="354" to-port="0" /> + <edge from-layer="353" from-port="0" to-layer="354" to-port="1" /> + <edge from-layer="354" from-port="2" to-layer="356" to-port="0" /> + <edge from-layer="355" from-port="0" to-layer="356" to-port="1" /> + <edge from-layer="356" from-port="2" to-layer="357" to-port="2" /> + <edge from-layer="357" from-port="4" to-layer="359" to-port="0" /> + <edge from-layer="358" from-port="0" to-layer="359" to-port="1" /> + <edge from-layer="359" from-port="2" to-layer="361" to-port="0" /> + <edge from-layer="360" from-port="0" to-layer="361" to-port="1" /> + <edge from-layer="361" from-port="2" to-layer="363" to-port="0" /> + <edge from-layer="362" from-port="0" to-layer="363" to-port="1" /> + <edge from-layer="363" from-port="2" to-layer="365" to-port="0" /> + <edge from-layer="364" from-port="0" to-layer="365" to-port="1" /> + <edge from-layer="365" from-port="2" to-layer="366" to-port="0" /> + <edge from-layer="366" from-port="2" to-layer="368" to-port="0" /> + <edge from-layer="367" from-port="0" to-layer="368" to-port="1" /> + <edge from-layer="368" from-port="2" to-layer="370" to-port="0" /> + <edge from-layer="369" from-port="0" to-layer="370" to-port="1" /> + <edge from-layer="370" from-port="2" to-layer="372" to-port="0" /> + <edge from-layer="371" from-port="0" to-layer="372" to-port="1" /> + <edge from-layer="372" from-port="2" to-layer="374" to-port="0" /> + <edge from-layer="372" from-port="2" to-layer="382" to-port="1" /> + <edge from-layer="373" from-port="0" to-layer="374" to-port="1" /> + <edge from-layer="374" from-port="2" to-layer="376" to-port="0" /> + <edge from-layer="375" from-port="0" to-layer="376" to-port="1" /> + <edge from-layer="376" from-port="2" to-layer="377" to-port="0" /> + <edge from-layer="377" from-port="1" to-layer="379" to-port="0" /> + <edge from-layer="378" from-port="0" to-layer="379" to-port="1" /> + <edge from-layer="379" from-port="2" to-layer="381" to-port="0" /> + <edge from-layer="380" from-port="0" to-layer="381" to-port="1" /> + <edge from-layer="381" from-port="2" to-layer="382" to-port="0" /> + <edge from-layer="382" from-port="2" to-layer="384" to-port="0" /> + <edge from-layer="383" from-port="0" to-layer="384" to-port="1" /> + <edge from-layer="384" from-port="2" to-layer="386" to-port="0" /> + <edge from-layer="385" from-port="0" to-layer="386" to-port="1" /> + <edge from-layer="386" from-port="2" to-layer="388" to-port="0" /> + <edge from-layer="387" from-port="0" to-layer="388" to-port="1" /> + <edge from-layer="388" from-port="2" to-layer="422" to-port="1" /> + <edge from-layer="388" from-port="2" to-layer="406" to-port="0" /> + <edge from-layer="388" from-port="2" to-layer="390" to-port="0" /> + <edge from-layer="388" from-port="2" to-layer="398" to-port="0" /> + <edge from-layer="389" from-port="0" to-layer="390" to-port="1" /> + <edge from-layer="390" from-port="2" to-layer="392" to-port="0" /> + <edge from-layer="391" from-port="0" to-layer="392" to-port="1" /> + <edge from-layer="392" from-port="2" to-layer="394" to-port="0" /> + <edge from-layer="393" from-port="0" to-layer="394" to-port="1" /> + <edge from-layer="394" from-port="2" to-layer="396" to-port="0" /> + <edge from-layer="395" from-port="0" to-layer="396" to-port="1" /> + <edge from-layer="396" from-port="2" to-layer="413" to-port="0" /> + <edge from-layer="397" from-port="0" to-layer="398" to-port="1" /> + <edge from-layer="398" from-port="2" to-layer="400" to-port="0" /> + <edge from-layer="399" from-port="0" to-layer="400" to-port="1" /> + <edge from-layer="400" from-port="2" to-layer="402" to-port="0" /> + <edge from-layer="401" from-port="0" to-layer="402" to-port="1" /> + <edge from-layer="402" from-port="2" to-layer="404" to-port="0" /> + <edge from-layer="403" from-port="0" to-layer="404" to-port="1" /> + <edge from-layer="404" from-port="2" to-layer="413" to-port="1" /> + <edge from-layer="405" from-port="0" to-layer="406" to-port="1" /> + <edge from-layer="406" from-port="2" to-layer="408" to-port="0" /> + <edge from-layer="407" from-port="0" to-layer="408" to-port="1" /> + <edge from-layer="408" from-port="2" to-layer="410" to-port="0" /> + <edge from-layer="409" from-port="0" to-layer="410" to-port="1" /> + <edge from-layer="410" from-port="2" to-layer="412" to-port="0" /> + <edge from-layer="411" from-port="0" to-layer="412" to-port="1" /> + <edge from-layer="412" from-port="2" to-layer="413" to-port="2" /> + <edge from-layer="413" from-port="4" to-layer="415" to-port="0" /> + <edge from-layer="414" from-port="0" to-layer="415" to-port="1" /> + <edge from-layer="415" from-port="2" to-layer="417" to-port="0" /> + <edge from-layer="416" from-port="0" to-layer="417" to-port="1" /> + <edge from-layer="417" from-port="2" to-layer="419" to-port="0" /> + <edge from-layer="418" from-port="0" to-layer="419" to-port="1" /> + <edge from-layer="419" from-port="2" to-layer="421" to-port="0" /> + <edge from-layer="420" from-port="0" to-layer="421" to-port="1" /> + <edge from-layer="421" from-port="2" to-layer="422" to-port="0" /> + <edge from-layer="422" from-port="2" to-layer="424" to-port="0" /> + <edge from-layer="423" from-port="0" to-layer="424" to-port="1" /> + <edge from-layer="424" from-port="2" to-layer="426" to-port="0" /> + <edge from-layer="425" from-port="0" to-layer="426" to-port="1" /> + <edge from-layer="426" from-port="2" to-layer="428" to-port="0" /> + <edge from-layer="427" from-port="0" to-layer="428" to-port="1" /> + <edge from-layer="428" from-port="2" to-layer="430" to-port="0" /> + <edge from-layer="428" from-port="2" to-layer="438" to-port="1" /> + <edge from-layer="429" from-port="0" to-layer="430" to-port="1" /> + <edge from-layer="430" from-port="2" to-layer="432" to-port="0" /> + <edge from-layer="431" from-port="0" to-layer="432" to-port="1" /> + <edge from-layer="432" from-port="2" to-layer="433" to-port="0" /> + <edge from-layer="433" from-port="1" to-layer="435" to-port="0" /> + <edge from-layer="434" from-port="0" to-layer="435" to-port="1" /> + <edge from-layer="435" from-port="2" to-layer="437" to-port="0" /> + <edge from-layer="436" from-port="0" to-layer="437" to-port="1" /> + <edge from-layer="437" from-port="2" to-layer="438" to-port="0" /> + <edge from-layer="438" from-port="2" to-layer="440" to-port="0" /> + <edge from-layer="439" from-port="0" to-layer="440" to-port="1" /> + <edge from-layer="440" from-port="2" to-layer="442" to-port="0" /> + <edge from-layer="441" from-port="0" to-layer="442" to-port="1" /> + <edge from-layer="442" from-port="2" to-layer="444" to-port="0" /> + <edge from-layer="443" from-port="0" to-layer="444" to-port="1" /> + <edge from-layer="444" from-port="2" to-layer="478" to-port="1" /> + <edge from-layer="444" from-port="2" to-layer="462" to-port="0" /> + <edge from-layer="444" from-port="2" to-layer="454" to-port="0" /> + <edge from-layer="444" from-port="2" to-layer="446" to-port="0" /> + <edge from-layer="445" from-port="0" to-layer="446" to-port="1" /> + <edge from-layer="446" from-port="2" to-layer="448" to-port="0" /> + <edge from-layer="447" from-port="0" to-layer="448" to-port="1" /> + <edge from-layer="448" from-port="2" to-layer="450" to-port="0" /> + <edge from-layer="449" from-port="0" to-layer="450" to-port="1" /> + <edge from-layer="450" from-port="2" to-layer="452" to-port="0" /> + <edge from-layer="451" from-port="0" to-layer="452" to-port="1" /> + <edge from-layer="452" from-port="2" to-layer="469" to-port="0" /> + <edge from-layer="453" from-port="0" to-layer="454" to-port="1" /> + <edge from-layer="454" from-port="2" to-layer="456" to-port="0" /> + <edge from-layer="455" from-port="0" to-layer="456" to-port="1" /> + <edge from-layer="456" from-port="2" to-layer="458" to-port="0" /> + <edge from-layer="457" from-port="0" to-layer="458" to-port="1" /> + <edge from-layer="458" from-port="2" to-layer="460" to-port="0" /> + <edge from-layer="459" from-port="0" to-layer="460" to-port="1" /> + <edge from-layer="460" from-port="2" to-layer="469" to-port="1" /> + <edge from-layer="461" from-port="0" to-layer="462" to-port="1" /> + <edge from-layer="462" from-port="2" to-layer="464" to-port="0" /> + <edge from-layer="463" from-port="0" to-layer="464" to-port="1" /> + <edge from-layer="464" from-port="2" to-layer="466" to-port="0" /> + <edge from-layer="465" from-port="0" to-layer="466" to-port="1" /> + <edge from-layer="466" from-port="2" to-layer="468" to-port="0" /> + <edge from-layer="467" from-port="0" to-layer="468" to-port="1" /> + <edge from-layer="468" from-port="2" to-layer="469" to-port="2" /> + <edge from-layer="469" from-port="4" to-layer="471" to-port="0" /> + <edge from-layer="470" from-port="0" to-layer="471" to-port="1" /> + <edge from-layer="471" from-port="2" to-layer="473" to-port="0" /> + <edge from-layer="472" from-port="0" to-layer="473" to-port="1" /> + <edge from-layer="473" from-port="2" to-layer="475" to-port="0" /> + <edge from-layer="474" from-port="0" to-layer="475" to-port="1" /> + <edge from-layer="475" from-port="2" to-layer="477" to-port="0" /> + <edge from-layer="476" from-port="0" to-layer="477" to-port="1" /> + <edge from-layer="477" from-port="2" to-layer="478" to-port="0" /> + <edge from-layer="478" from-port="2" to-layer="480" to-port="0" /> + <edge from-layer="479" from-port="0" to-layer="480" to-port="1" /> + <edge from-layer="480" from-port="2" to-layer="482" to-port="0" /> + <edge from-layer="481" from-port="0" to-layer="482" to-port="1" /> + <edge from-layer="482" from-port="2" to-layer="484" to-port="0" /> + <edge from-layer="483" from-port="0" to-layer="484" to-port="1" /> + <edge from-layer="484" from-port="2" to-layer="486" to-port="0" /> + <edge from-layer="484" from-port="2" to-layer="494" to-port="1" /> + <edge from-layer="485" from-port="0" to-layer="486" to-port="1" /> + <edge from-layer="486" from-port="2" to-layer="488" to-port="0" /> + <edge from-layer="487" from-port="0" to-layer="488" to-port="1" /> + <edge from-layer="488" from-port="2" to-layer="489" to-port="0" /> + <edge from-layer="489" from-port="1" to-layer="491" to-port="0" /> + <edge from-layer="490" from-port="0" to-layer="491" to-port="1" /> + <edge from-layer="491" from-port="2" to-layer="493" to-port="0" /> + <edge from-layer="492" from-port="0" to-layer="493" to-port="1" /> + <edge from-layer="493" from-port="2" to-layer="494" to-port="0" /> + <edge from-layer="494" from-port="2" to-layer="496" to-port="0" /> + <edge from-layer="495" from-port="0" to-layer="496" to-port="1" /> + <edge from-layer="496" from-port="2" to-layer="498" to-port="0" /> + <edge from-layer="497" from-port="0" to-layer="498" to-port="1" /> + <edge from-layer="498" from-port="2" to-layer="500" to-port="0" /> + <edge from-layer="499" from-port="0" to-layer="500" to-port="1" /> + <edge from-layer="500" from-port="2" to-layer="510" to-port="0" /> + <edge from-layer="500" from-port="2" to-layer="534" to-port="1" /> + <edge from-layer="500" from-port="2" to-layer="518" to-port="0" /> + <edge from-layer="500" from-port="2" to-layer="502" to-port="0" /> + <edge from-layer="501" from-port="0" to-layer="502" to-port="1" /> + <edge from-layer="502" from-port="2" to-layer="504" to-port="0" /> + <edge from-layer="503" from-port="0" to-layer="504" to-port="1" /> + <edge from-layer="504" from-port="2" to-layer="506" to-port="0" /> + <edge from-layer="505" from-port="0" to-layer="506" to-port="1" /> + <edge from-layer="506" from-port="2" to-layer="508" to-port="0" /> + <edge from-layer="507" from-port="0" to-layer="508" to-port="1" /> + <edge from-layer="508" from-port="2" to-layer="525" to-port="0" /> + <edge from-layer="509" from-port="0" to-layer="510" to-port="1" /> + <edge from-layer="510" from-port="2" to-layer="512" to-port="0" /> + <edge from-layer="511" from-port="0" to-layer="512" to-port="1" /> + <edge from-layer="512" from-port="2" to-layer="514" to-port="0" /> + <edge from-layer="513" from-port="0" to-layer="514" to-port="1" /> + <edge from-layer="514" from-port="2" to-layer="516" to-port="0" /> + <edge from-layer="515" from-port="0" to-layer="516" to-port="1" /> + <edge from-layer="516" from-port="2" to-layer="525" to-port="1" /> + <edge from-layer="517" from-port="0" to-layer="518" to-port="1" /> + <edge from-layer="518" from-port="2" to-layer="520" to-port="0" /> + <edge from-layer="519" from-port="0" to-layer="520" to-port="1" /> + <edge from-layer="520" from-port="2" to-layer="522" to-port="0" /> + <edge from-layer="521" from-port="0" to-layer="522" to-port="1" /> + <edge from-layer="522" from-port="2" to-layer="524" to-port="0" /> + <edge from-layer="523" from-port="0" to-layer="524" to-port="1" /> + <edge from-layer="524" from-port="2" to-layer="525" to-port="2" /> + <edge from-layer="525" from-port="4" to-layer="527" to-port="0" /> + <edge from-layer="526" from-port="0" to-layer="527" to-port="1" /> + <edge from-layer="527" from-port="2" to-layer="529" to-port="0" /> + <edge from-layer="528" from-port="0" to-layer="529" to-port="1" /> + <edge from-layer="529" from-port="2" to-layer="531" to-port="0" /> + <edge from-layer="530" from-port="0" to-layer="531" to-port="1" /> + <edge from-layer="531" from-port="2" to-layer="533" to-port="0" /> + <edge from-layer="532" from-port="0" to-layer="533" to-port="1" /> + <edge from-layer="533" from-port="2" to-layer="534" to-port="0" /> + <edge from-layer="534" from-port="2" to-layer="536" to-port="0" /> + <edge from-layer="535" from-port="0" to-layer="536" to-port="1" /> + <edge from-layer="536" from-port="2" to-layer="538" to-port="0" /> + <edge from-layer="537" from-port="0" to-layer="538" to-port="1" /> + <edge from-layer="538" from-port="2" to-layer="540" to-port="0" /> + <edge from-layer="539" from-port="0" to-layer="540" to-port="1" /> + <edge from-layer="540" from-port="2" to-layer="542" to-port="0" /> + <edge from-layer="540" from-port="2" to-layer="550" to-port="1" /> + <edge from-layer="541" from-port="0" to-layer="542" to-port="1" /> + <edge from-layer="542" from-port="2" to-layer="544" to-port="0" /> + <edge from-layer="543" from-port="0" to-layer="544" to-port="1" /> + <edge from-layer="544" from-port="2" to-layer="545" to-port="0" /> + <edge from-layer="545" from-port="1" to-layer="547" to-port="0" /> + <edge from-layer="546" from-port="0" to-layer="547" to-port="1" /> + <edge from-layer="547" from-port="2" to-layer="549" to-port="0" /> + <edge from-layer="548" from-port="0" to-layer="549" to-port="1" /> + <edge from-layer="549" from-port="2" to-layer="550" to-port="0" /> + <edge from-layer="550" from-port="2" to-layer="552" to-port="0" /> + <edge from-layer="551" from-port="0" to-layer="552" to-port="1" /> + <edge from-layer="552" from-port="2" to-layer="554" to-port="0" /> + <edge from-layer="553" from-port="0" to-layer="554" to-port="1" /> + <edge from-layer="554" from-port="2" to-layer="556" to-port="0" /> + <edge from-layer="555" from-port="0" to-layer="556" to-port="1" /> + <edge from-layer="556" from-port="2" to-layer="590" to-port="1" /> + <edge from-layer="556" from-port="2" to-layer="574" to-port="0" /> + <edge from-layer="556" from-port="2" to-layer="566" to-port="0" /> + <edge from-layer="556" from-port="2" to-layer="558" to-port="0" /> + <edge from-layer="557" from-port="0" to-layer="558" to-port="1" /> + <edge from-layer="558" from-port="2" to-layer="560" to-port="0" /> + <edge from-layer="559" from-port="0" to-layer="560" to-port="1" /> + <edge from-layer="560" from-port="2" to-layer="562" to-port="0" /> + <edge from-layer="561" from-port="0" to-layer="562" to-port="1" /> + <edge from-layer="562" from-port="2" to-layer="564" to-port="0" /> + <edge from-layer="563" from-port="0" to-layer="564" to-port="1" /> + <edge from-layer="564" from-port="2" to-layer="581" to-port="0" /> + <edge from-layer="565" from-port="0" to-layer="566" to-port="1" /> + <edge from-layer="566" from-port="2" to-layer="568" to-port="0" /> + <edge from-layer="567" from-port="0" to-layer="568" to-port="1" /> + <edge from-layer="568" from-port="2" to-layer="570" to-port="0" /> + <edge from-layer="569" from-port="0" to-layer="570" to-port="1" /> + <edge from-layer="570" from-port="2" to-layer="572" to-port="0" /> + <edge from-layer="571" from-port="0" to-layer="572" to-port="1" /> + <edge from-layer="572" from-port="2" to-layer="581" to-port="1" /> + <edge from-layer="573" from-port="0" to-layer="574" to-port="1" /> + <edge from-layer="574" from-port="2" to-layer="576" to-port="0" /> + <edge from-layer="575" from-port="0" to-layer="576" to-port="1" /> + <edge from-layer="576" from-port="2" to-layer="578" to-port="0" /> + <edge from-layer="577" from-port="0" to-layer="578" to-port="1" /> + <edge from-layer="578" from-port="2" to-layer="580" to-port="0" /> + <edge from-layer="579" from-port="0" to-layer="580" to-port="1" /> + <edge from-layer="580" from-port="2" to-layer="581" to-port="2" /> + <edge from-layer="581" from-port="4" to-layer="583" to-port="0" /> + <edge from-layer="582" from-port="0" to-layer="583" to-port="1" /> + <edge from-layer="583" from-port="2" to-layer="585" to-port="0" /> + <edge from-layer="584" from-port="0" to-layer="585" to-port="1" /> + <edge from-layer="585" from-port="2" to-layer="587" to-port="0" /> + <edge from-layer="586" from-port="0" to-layer="587" to-port="1" /> + <edge from-layer="587" from-port="2" to-layer="589" to-port="0" /> + <edge from-layer="588" from-port="0" to-layer="589" to-port="1" /> + <edge from-layer="589" from-port="2" to-layer="590" to-port="0" /> + <edge from-layer="590" from-port="2" to-layer="592" to-port="0" /> + <edge from-layer="591" from-port="0" to-layer="592" to-port="1" /> + <edge from-layer="592" from-port="2" to-layer="594" to-port="0" /> + <edge from-layer="593" from-port="0" to-layer="594" to-port="1" /> + <edge from-layer="594" from-port="2" to-layer="596" to-port="0" /> + <edge from-layer="595" from-port="0" to-layer="596" to-port="1" /> + <edge from-layer="596" from-port="2" to-layer="598" to-port="0" /> + <edge from-layer="596" from-port="2" to-layer="606" to-port="1" /> + <edge from-layer="597" from-port="0" to-layer="598" to-port="1" /> + <edge from-layer="598" from-port="2" to-layer="600" to-port="0" /> + <edge from-layer="599" from-port="0" to-layer="600" to-port="1" /> + <edge from-layer="600" from-port="2" to-layer="601" to-port="0" /> + <edge from-layer="601" from-port="1" to-layer="603" to-port="0" /> + <edge from-layer="602" from-port="0" to-layer="603" to-port="1" /> + <edge from-layer="603" from-port="2" to-layer="605" to-port="0" /> + <edge from-layer="604" from-port="0" to-layer="605" to-port="1" /> + <edge from-layer="605" from-port="2" to-layer="606" to-port="0" /> + <edge from-layer="606" from-port="2" to-layer="608" to-port="0" /> + <edge from-layer="607" from-port="0" to-layer="608" to-port="1" /> + <edge from-layer="608" from-port="2" to-layer="610" to-port="0" /> + <edge from-layer="609" from-port="0" to-layer="610" to-port="1" /> + <edge from-layer="610" from-port="2" to-layer="612" to-port="0" /> + <edge from-layer="611" from-port="0" to-layer="612" to-port="1" /> + <edge from-layer="612" from-port="2" to-layer="646" to-port="1" /> + <edge from-layer="612" from-port="2" to-layer="630" to-port="0" /> + <edge from-layer="612" from-port="2" to-layer="622" to-port="0" /> + <edge from-layer="612" from-port="2" to-layer="614" to-port="0" /> + <edge from-layer="613" from-port="0" to-layer="614" to-port="1" /> + <edge from-layer="614" from-port="2" to-layer="616" to-port="0" /> + <edge from-layer="615" from-port="0" to-layer="616" to-port="1" /> + <edge from-layer="616" from-port="2" to-layer="618" to-port="0" /> + <edge from-layer="617" from-port="0" to-layer="618" to-port="1" /> + <edge from-layer="618" from-port="2" to-layer="620" to-port="0" /> + <edge from-layer="619" from-port="0" to-layer="620" to-port="1" /> + <edge from-layer="620" from-port="2" to-layer="637" to-port="0" /> + <edge from-layer="621" from-port="0" to-layer="622" to-port="1" /> + <edge from-layer="622" from-port="2" to-layer="624" to-port="0" /> + <edge from-layer="623" from-port="0" to-layer="624" to-port="1" /> + <edge from-layer="624" from-port="2" to-layer="626" to-port="0" /> + <edge from-layer="625" from-port="0" to-layer="626" to-port="1" /> + <edge from-layer="626" from-port="2" to-layer="628" to-port="0" /> + <edge from-layer="627" from-port="0" to-layer="628" to-port="1" /> + <edge from-layer="628" from-port="2" to-layer="637" to-port="1" /> + <edge from-layer="629" from-port="0" to-layer="630" to-port="1" /> + <edge from-layer="630" from-port="2" to-layer="632" to-port="0" /> + <edge from-layer="631" from-port="0" to-layer="632" to-port="1" /> + <edge from-layer="632" from-port="2" to-layer="634" to-port="0" /> + <edge from-layer="633" from-port="0" to-layer="634" to-port="1" /> + <edge from-layer="634" from-port="2" to-layer="636" to-port="0" /> + <edge from-layer="635" from-port="0" to-layer="636" to-port="1" /> + <edge from-layer="636" from-port="2" to-layer="637" to-port="2" /> + <edge from-layer="637" from-port="4" to-layer="639" to-port="0" /> + <edge from-layer="638" from-port="0" to-layer="639" to-port="1" /> + <edge from-layer="639" from-port="2" to-layer="641" to-port="0" /> + <edge from-layer="640" from-port="0" to-layer="641" to-port="1" /> + <edge from-layer="641" from-port="2" to-layer="643" to-port="0" /> + <edge from-layer="642" from-port="0" to-layer="643" to-port="1" /> + <edge from-layer="643" from-port="2" to-layer="645" to-port="0" /> + <edge from-layer="644" from-port="0" to-layer="645" to-port="1" /> + <edge from-layer="645" from-port="2" to-layer="646" to-port="0" /> + <edge from-layer="646" from-port="2" to-layer="648" to-port="0" /> + <edge from-layer="647" from-port="0" to-layer="648" to-port="1" /> + <edge from-layer="648" from-port="2" to-layer="650" to-port="0" /> + <edge from-layer="649" from-port="0" to-layer="650" to-port="1" /> + <edge from-layer="650" from-port="2" to-layer="652" to-port="0" /> + <edge from-layer="651" from-port="0" to-layer="652" to-port="1" /> + <edge from-layer="652" from-port="2" to-layer="654" to-port="0" /> + <edge from-layer="652" from-port="2" to-layer="662" to-port="1" /> + <edge from-layer="653" from-port="0" to-layer="654" to-port="1" /> + <edge from-layer="654" from-port="2" to-layer="656" to-port="0" /> + <edge from-layer="655" from-port="0" to-layer="656" to-port="1" /> + <edge from-layer="656" from-port="2" to-layer="657" to-port="0" /> + <edge from-layer="657" from-port="1" to-layer="659" to-port="0" /> + <edge from-layer="658" from-port="0" to-layer="659" to-port="1" /> + <edge from-layer="659" from-port="2" to-layer="661" to-port="0" /> + <edge from-layer="660" from-port="0" to-layer="661" to-port="1" /> + <edge from-layer="661" from-port="2" to-layer="662" to-port="0" /> + <edge from-layer="662" from-port="2" to-layer="664" to-port="0" /> + <edge from-layer="663" from-port="0" to-layer="664" to-port="1" /> + <edge from-layer="664" from-port="2" to-layer="666" to-port="0" /> + <edge from-layer="665" from-port="0" to-layer="666" to-port="1" /> + <edge from-layer="666" from-port="2" to-layer="668" to-port="0" /> + <edge from-layer="667" from-port="0" to-layer="668" to-port="1" /> + <edge from-layer="668" from-port="2" to-layer="702" to-port="1" /> + <edge from-layer="668" from-port="2" to-layer="686" to-port="0" /> + <edge from-layer="668" from-port="2" to-layer="678" to-port="0" /> + <edge from-layer="668" from-port="2" to-layer="670" to-port="0" /> + <edge from-layer="669" from-port="0" to-layer="670" to-port="1" /> + <edge from-layer="670" from-port="2" to-layer="672" to-port="0" /> + <edge from-layer="671" from-port="0" to-layer="672" to-port="1" /> + <edge from-layer="672" from-port="2" to-layer="674" to-port="0" /> + <edge from-layer="673" from-port="0" to-layer="674" to-port="1" /> + <edge from-layer="674" from-port="2" to-layer="676" to-port="0" /> + <edge from-layer="675" from-port="0" to-layer="676" to-port="1" /> + <edge from-layer="676" from-port="2" to-layer="693" to-port="0" /> + <edge from-layer="677" from-port="0" to-layer="678" to-port="1" /> + <edge from-layer="678" from-port="2" to-layer="680" to-port="0" /> + <edge from-layer="679" from-port="0" to-layer="680" to-port="1" /> + <edge from-layer="680" from-port="2" to-layer="682" to-port="0" /> + <edge from-layer="681" from-port="0" to-layer="682" to-port="1" /> + <edge from-layer="682" from-port="2" to-layer="684" to-port="0" /> + <edge from-layer="683" from-port="0" to-layer="684" to-port="1" /> + <edge from-layer="684" from-port="2" to-layer="693" to-port="1" /> + <edge from-layer="685" from-port="0" to-layer="686" to-port="1" /> + <edge from-layer="686" from-port="2" to-layer="688" to-port="0" /> + <edge from-layer="687" from-port="0" to-layer="688" to-port="1" /> + <edge from-layer="688" from-port="2" to-layer="690" to-port="0" /> + <edge from-layer="689" from-port="0" to-layer="690" to-port="1" /> + <edge from-layer="690" from-port="2" to-layer="692" to-port="0" /> + <edge from-layer="691" from-port="0" to-layer="692" to-port="1" /> + <edge from-layer="692" from-port="2" to-layer="693" to-port="2" /> + <edge from-layer="693" from-port="4" to-layer="695" to-port="0" /> + <edge from-layer="694" from-port="0" to-layer="695" to-port="1" /> + <edge from-layer="695" from-port="2" to-layer="697" to-port="0" /> + <edge from-layer="696" from-port="0" to-layer="697" to-port="1" /> + <edge from-layer="697" from-port="2" to-layer="699" to-port="0" /> + <edge from-layer="698" from-port="0" to-layer="699" to-port="1" /> + <edge from-layer="699" from-port="2" to-layer="701" to-port="0" /> + <edge from-layer="700" from-port="0" to-layer="701" to-port="1" /> + <edge from-layer="701" from-port="2" to-layer="702" to-port="0" /> + <edge from-layer="702" from-port="2" to-layer="704" to-port="0" /> + <edge from-layer="703" from-port="0" to-layer="704" to-port="1" /> + <edge from-layer="704" from-port="2" to-layer="706" to-port="0" /> + <edge from-layer="705" from-port="0" to-layer="706" to-port="1" /> + <edge from-layer="706" from-port="2" to-layer="708" to-port="0" /> + <edge from-layer="707" from-port="0" to-layer="708" to-port="1" /> + <edge from-layer="708" from-port="2" to-layer="710" to-port="0" /> + <edge from-layer="708" from-port="2" to-layer="718" to-port="1" /> + <edge from-layer="709" from-port="0" to-layer="710" to-port="1" /> + <edge from-layer="710" from-port="2" to-layer="712" to-port="0" /> + <edge from-layer="711" from-port="0" to-layer="712" to-port="1" /> + <edge from-layer="712" from-port="2" to-layer="713" to-port="0" /> + <edge from-layer="713" from-port="1" to-layer="715" to-port="0" /> + <edge from-layer="714" from-port="0" to-layer="715" to-port="1" /> + <edge from-layer="715" from-port="2" to-layer="717" to-port="0" /> + <edge from-layer="716" from-port="0" to-layer="717" to-port="1" /> + <edge from-layer="717" from-port="2" to-layer="718" to-port="0" /> + <edge from-layer="718" from-port="2" to-layer="720" to-port="0" /> + <edge from-layer="719" from-port="0" to-layer="720" to-port="1" /> + <edge from-layer="720" from-port="2" to-layer="722" to-port="0" /> + <edge from-layer="721" from-port="0" to-layer="722" to-port="1" /> + <edge from-layer="722" from-port="2" to-layer="724" to-port="0" /> + <edge from-layer="723" from-port="0" to-layer="724" to-port="1" /> + <edge from-layer="724" from-port="2" to-layer="725" to-port="0" /> + </edges> + <rt_info> + <Runtime_version value="2024.4.1-16618-643f23d1318-releases/2024/4" /> + <conversion_parameters> + <framework value="pytorch" /> + <is_python_object value="True" /> + </conversion_parameters> + <optimum> + <optimum_intel_version value="1.20.1" /> + <optimum_version value="1.23.3" /> + <pytorch_version value="2.5.1" /> + <transformers_version value="4.46.2" /> + </optimum> + </rt_info> +</net>