<?xml version="1.0"?> <net name="Model3" version="11"> <layers> <layer id="3" name="decoder_input_ids" type="Parameter" version="opset1"> <data shape="?,?" element_type="i64" /> <output> <port id="0" precision="I64" names="input_ids"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="2" name="Parameter_33105" type="Parameter" version="opset1"> <data shape="?,?,1024" element_type="f32" /> <output> <port id="0" precision="FP32" names="encoder_hidden_states"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1" name="cache_position" type="Parameter" version="opset1"> <data shape="?" element_type="i64" /> <output> <port id="0" precision="I64" names="cache_position"> <dim>-1</dim> </port> </output> </layer> <layer id="0" name="beam_idx" type="Parameter" version="opset1"> <data shape="?" element_type="i32" /> <output> <port id="0" precision="I32" names="beam_idx"> <dim>-1</dim> </port> </output> </layer> <layer id="4" name="self.model.model.decoder.layers.16.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="0" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5" name="Convert_920016" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="6" name="self.model.model.decoder.layers.16.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="524288" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="7" name="Convert_920019" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="8" name="self.model.model.decoder.layers.16.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="9" name="self.model.model.decoder.layers.16.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="528384" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="10" name="self.model.model.decoder.layers.16.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="11" name="Constant_920024" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="12" name="Reshape_920025" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="13" name="self.model.model.decoder.layers.16.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="14" name="__module.model.model.decoder.layers.16.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="15" name="Constant_54747" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="544784" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="16" name="__module.model.model.decoder.layers.16.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2266,tensor.203"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="17" name="Constant_58091" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="18" name="__module.model.model.decoder.layers.16.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2268"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="19" name="__module.model.model.decoder.layers.16.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="20" name="__module.model.model.decoder.layers.16.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2269"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="21" name="ReadValue_61573" type="ReadValue" version="opset6"> <data variable_id="2269" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="23" name="self.model.model.decoder.layers.17.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="548928" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="24" name="Convert_924315" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="25" name="self.model.model.decoder.layers.17.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="1073216" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="26" name="Convert_924318" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="27" name="self.model.model.decoder.layers.17.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="28" name="self.model.model.decoder.layers.17.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="1077312" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="29" name="self.model.model.decoder.layers.17.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="30" name="Constant_924323" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="31" name="Reshape_924324" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="32" name="self.model.model.decoder.layers.17.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="33" name="__module.model.model.decoder.layers.17.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2375,tensor.213"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="34" name="Constant_58098" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="35" name="__module.model.model.decoder.layers.17.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2377"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="36" name="__module.model.model.decoder.layers.17.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="37" name="__module.model.model.decoder.layers.17.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2378"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="38" name="ReadValue_61571" type="ReadValue" version="opset6"> <data variable_id="2378" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="40" name="self.model.model.decoder.layers.8.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="1093696" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="41" name="Convert_928614" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="42" name="self.model.model.decoder.layers.8.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="1617984" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="43" name="Convert_928617" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="44" name="self.model.model.decoder.layers.8.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="45" name="self.model.model.decoder.layers.8.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="1622080" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="46" name="self.model.model.decoder.layers.8.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="47" name="Constant_928622" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="48" name="Reshape_928623" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="49" name="self.model.model.decoder.layers.8.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="50" name="__module.model.model.decoder.layers.8.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="51" name="Constant_54635" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="1638464" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="52" name="__module.model.model.decoder.layers.8.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1338,tensor.107"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="53" name="Constant_58027" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="54" name="__module.model.model.decoder.layers.8.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1340"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="55" name="__module.model.model.decoder.layers.8.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="56" name="__module.model.model.decoder.layers.8.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1341"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="57" name="ReadValue_61569" type="ReadValue" version="opset6"> <data variable_id="1341" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="59" name="self.model.model.decoder.layers.16.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="1642560" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="60" name="Convert_932913" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="61" name="self.model.model.decoder.layers.16.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="2166848" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="62" name="Convert_932916" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="63" name="self.model.model.decoder.layers.16.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="64" name="self.model.model.decoder.layers.16.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="2170944" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="65" name="self.model.model.decoder.layers.16.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="66" name="Constant_932921" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="67" name="Reshape_932922" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="68" name="self.model.model.decoder.layers.16.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="69" name="__module.model.model.decoder.layers.16.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2259,tensor.201"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="70" name="Constant_58090" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="71" name="__module.model.model.decoder.layers.16.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2261"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="72" name="__module.model.model.decoder.layers.16.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="73" name="__module.model.model.decoder.layers.16.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2262"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="74" name="ReadValue_61567" type="ReadValue" version="opset6"> <data variable_id="2262" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="76" name="self.model.model.decoder.layers.15.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="2187328" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="77" name="Convert_937212" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="78" name="self.model.model.decoder.layers.15.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="2711616" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="79" name="Convert_937215" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="80" name="self.model.model.decoder.layers.15.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="81" name="self.model.model.decoder.layers.15.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="2715712" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="82" name="self.model.model.decoder.layers.15.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="83" name="Constant_937220" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="84" name="Reshape_937221" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="85" name="self.model.model.decoder.layers.15.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="86" name="__module.model.model.decoder.layers.15.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="87" name="Constant_54733" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="2732096" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="88" name="__module.model.model.decoder.layers.15.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2150,tensor.191"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="89" name="Constant_58083" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="90" name="__module.model.model.decoder.layers.15.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2152"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="91" name="__module.model.model.decoder.layers.15.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="92" name="__module.model.model.decoder.layers.15.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2153"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="93" name="ReadValue_61565" type="ReadValue" version="opset6"> <data variable_id="2153" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="95" name="self.model.model.decoder.layers.7.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="2736192" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="96" name="Convert_941511" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="97" name="self.model.model.decoder.layers.7.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="3260480" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="98" name="Convert_941514" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="99" name="self.model.model.decoder.layers.7.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="100" name="self.model.model.decoder.layers.7.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="3264576" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="101" name="self.model.model.decoder.layers.7.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="102" name="Constant_941519" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="103" name="Reshape_941520" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="104" name="self.model.model.decoder.layers.7.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="105" name="__module.model.model.decoder.layers.7.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="106" name="Constant_54621" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="3280960" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="107" name="__module.model.model.decoder.layers.7.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1222,tensor.95"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="108" name="Constant_58019" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="109" name="__module.model.model.decoder.layers.7.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1224"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="110" name="__module.model.model.decoder.layers.7.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="111" name="__module.model.model.decoder.layers.7.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1225"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="112" name="ReadValue_61563" type="ReadValue" version="opset6"> <data variable_id="1225" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="114" name="self.model.model.decoder.layers.8.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="3285056" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="115" name="Convert_945810" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="116" name="self.model.model.decoder.layers.8.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="3809344" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="117" name="Convert_945813" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="118" name="self.model.model.decoder.layers.8.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="119" name="self.model.model.decoder.layers.8.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="3813440" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="120" name="self.model.model.decoder.layers.8.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="121" name="Constant_945818" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="122" name="Reshape_945819" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="123" name="self.model.model.decoder.layers.8.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="124" name="__module.model.model.decoder.layers.8.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1331,tensor.105"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="125" name="Constant_58026" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="126" name="__module.model.model.decoder.layers.8.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1333"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="127" name="__module.model.model.decoder.layers.8.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="128" name="__module.model.model.decoder.layers.8.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1334"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="129" name="ReadValue_61561" type="ReadValue" version="opset6"> <data variable_id="1334" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="131" name="self.model.model.decoder.layers.14.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="3829824" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="132" name="Convert_950109" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="133" name="self.model.model.decoder.layers.14.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="4354112" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="134" name="Convert_950112" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="135" name="self.model.model.decoder.layers.14.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="136" name="self.model.model.decoder.layers.14.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="4358208" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="137" name="self.model.model.decoder.layers.14.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="138" name="Constant_950117" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="139" name="Reshape_950118" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="140" name="self.model.model.decoder.layers.14.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="141" name="__module.model.model.decoder.layers.14.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="142" name="Constant_54719" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="4374592" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="143" name="__module.model.model.decoder.layers.14.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2034,tensor.179"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="144" name="Constant_58075" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="145" name="__module.model.model.decoder.layers.14.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2036"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="146" name="__module.model.model.decoder.layers.14.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="147" name="__module.model.model.decoder.layers.14.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2037"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="148" name="ReadValue_61559" type="ReadValue" version="opset6"> <data variable_id="2037" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="150" name="self.model.model.decoder.layers.15.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="4378688" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="151" name="Convert_954408" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="152" name="self.model.model.decoder.layers.15.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="4902976" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="153" name="Convert_954411" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="154" name="self.model.model.decoder.layers.15.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="155" name="self.model.model.decoder.layers.15.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="4907072" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="156" name="self.model.model.decoder.layers.15.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="157" name="Constant_954416" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="158" name="Reshape_954417" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="159" name="self.model.model.decoder.layers.15.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="160" name="__module.model.model.decoder.layers.15.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2143,tensor.189"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="161" name="Constant_58082" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="162" name="__module.model.model.decoder.layers.15.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2145"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="163" name="__module.model.model.decoder.layers.15.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="164" name="__module.model.model.decoder.layers.15.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2146"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="165" name="ReadValue_61557" type="ReadValue" version="opset6"> <data variable_id="2146" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="167" name="self.model.model.decoder.layers.7.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="4923456" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="168" name="Convert_958707" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="169" name="self.model.model.decoder.layers.7.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="5447744" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="170" name="Convert_958710" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="171" name="self.model.model.decoder.layers.7.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="172" name="self.model.model.decoder.layers.7.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="5451840" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="173" name="self.model.model.decoder.layers.7.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="174" name="Constant_958715" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="175" name="Reshape_958716" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="176" name="self.model.model.decoder.layers.7.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="177" name="__module.model.model.decoder.layers.7.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1215,tensor.93"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="178" name="Constant_58018" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="179" name="__module.model.model.decoder.layers.7.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1217"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="180" name="__module.model.model.decoder.layers.7.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="181" name="__module.model.model.decoder.layers.7.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1218"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="182" name="ReadValue_61555" type="ReadValue" version="opset6"> <data variable_id="1218" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="184" name="self.model.model.decoder.layers.23.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="5468224" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="185" name="Convert_963006" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="186" name="self.model.model.decoder.layers.23.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="5992512" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="187" name="Convert_963009" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="188" name="self.model.model.decoder.layers.23.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="189" name="self.model.model.decoder.layers.23.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="5996608" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="190" name="self.model.model.decoder.layers.23.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="191" name="Constant_963014" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="192" name="Reshape_963015" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="193" name="self.model.model.decoder.layers.23.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="194" name="__module.model.model.decoder.layers.23.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="195" name="Constant_54845" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="6012992" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="196" name="__module.model.model.decoder.layers.23.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3078,tensor"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="197" name="Constant_58147" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="198" name="__module.model.model.decoder.layers.23.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3080"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="199" name="__module.model.model.decoder.layers.23.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="200" name="__module.model.model.decoder.layers.23.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3081"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="201" name="ReadValue_61553" type="ReadValue" version="opset6"> <data variable_id="3081" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="203" name="self.model.model.decoder.layers.14.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="6017088" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="204" name="Convert_967305" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="205" name="self.model.model.decoder.layers.14.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="6541376" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="206" name="Convert_967308" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="207" name="self.model.model.decoder.layers.14.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="208" name="self.model.model.decoder.layers.14.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="6545472" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="209" name="self.model.model.decoder.layers.14.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="210" name="Constant_967313" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="211" name="Reshape_967314" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="212" name="self.model.model.decoder.layers.14.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="213" name="__module.model.model.decoder.layers.14.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2027,tensor.177"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="214" name="Constant_58074" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="215" name="__module.model.model.decoder.layers.14.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2029"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="216" name="__module.model.model.decoder.layers.14.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="217" name="__module.model.model.decoder.layers.14.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2030"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="218" name="ReadValue_61551" type="ReadValue" version="opset6"> <data variable_id="2030" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="220" name="self.model.model.decoder.layers.6.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="6561856" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="221" name="Convert_971604" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="222" name="self.model.model.decoder.layers.6.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="7086144" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="223" name="Convert_971607" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="224" name="self.model.model.decoder.layers.6.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="225" name="self.model.model.decoder.layers.6.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="7090240" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="226" name="self.model.model.decoder.layers.6.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="227" name="Constant_971612" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="228" name="Reshape_971613" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="229" name="self.model.model.decoder.layers.6.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="230" name="__module.model.model.decoder.layers.6.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="231" name="Constant_54607" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="7106624" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="232" name="__module.model.model.decoder.layers.6.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1106,tensor.83"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="233" name="Constant_58011" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="234" name="__module.model.model.decoder.layers.6.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1108"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="235" name="__module.model.model.decoder.layers.6.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="236" name="__module.model.model.decoder.layers.6.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1109"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="237" name="ReadValue_61549" type="ReadValue" version="opset6"> <data variable_id="1109" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="239" name="self.model.model.decoder.layers.13.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="7110720" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="240" name="Convert_975903" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="241" name="self.model.model.decoder.layers.13.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="7635008" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="242" name="Convert_975906" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="243" name="self.model.model.decoder.layers.13.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="244" name="self.model.model.decoder.layers.13.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="7639104" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="245" name="self.model.model.decoder.layers.13.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="246" name="Constant_975911" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="247" name="Reshape_975912" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="248" name="self.model.model.decoder.layers.13.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="249" name="__module.model.model.decoder.layers.13.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="250" name="Constant_54705" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="7655488" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="251" name="__module.model.model.decoder.layers.13.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1918,tensor.167"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="252" name="Constant_58067" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="253" name="__module.model.model.decoder.layers.13.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1920"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="254" name="__module.model.model.decoder.layers.13.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="255" name="__module.model.model.decoder.layers.13.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1921"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="256" name="ReadValue_61547" type="ReadValue" version="opset6"> <data variable_id="1921" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="258" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="7659584" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="259" name="Convert_980202" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="260" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="8183872" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="261" name="Convert_980205" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="262" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="263" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="8187968" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="264" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="265" name="Constant_980210" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="266" name="Reshape_980211" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="267" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="268" name="__module.model.model.decoder.layers.0.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="269" name="Constant_54523" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="8204352" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="270" name="__module.model.model.decoder.layers.0.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="410,tensor.11"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="271" name="Constant_57963" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="272" name="__module.model.model.decoder.layers.0.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="412"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="273" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="274" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="413"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="275" name="ReadValue_61545" type="ReadValue" version="opset6"> <data variable_id="413" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="277" name="self.model.model.decoder.layers.23.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="8208448" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="278" name="Convert_984501" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="279" name="self.model.model.decoder.layers.23.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="8732736" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="280" name="Convert_984504" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="281" name="self.model.model.decoder.layers.23.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="282" name="self.model.model.decoder.layers.23.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="8736832" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="283" name="self.model.model.decoder.layers.23.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="284" name="Constant_984509" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="285" name="Reshape_984510" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="286" name="self.model.model.decoder.layers.23.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="287" name="__module.model.model.decoder.layers.23.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3071,tensor.285"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="288" name="Constant_58146" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="289" name="__module.model.model.decoder.layers.23.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3073"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="290" name="__module.model.model.decoder.layers.23.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="291" name="__module.model.model.decoder.layers.23.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3074"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="292" name="ReadValue_61543" type="ReadValue" version="opset6"> <data variable_id="3074" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="294" name="self.model.model.decoder.layers.6.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="8753216" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="295" name="Convert_988800" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="296" name="self.model.model.decoder.layers.6.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="9277504" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="297" name="Convert_988803" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="298" name="self.model.model.decoder.layers.6.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="299" name="self.model.model.decoder.layers.6.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="9281600" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="300" name="self.model.model.decoder.layers.6.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="301" name="Constant_988808" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="302" name="Reshape_988809" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="303" name="self.model.model.decoder.layers.6.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="304" name="__module.model.model.decoder.layers.6.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1099,tensor.81"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="305" name="Constant_58010" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="306" name="__module.model.model.decoder.layers.6.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1101"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="307" name="__module.model.model.decoder.layers.6.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="308" name="__module.model.model.decoder.layers.6.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1102"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="309" name="ReadValue_61541" type="ReadValue" version="opset6"> <data variable_id="1102" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="311" name="self.model.model.decoder.layers.13.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="9297984" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="312" name="Convert_993099" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="313" name="self.model.model.decoder.layers.13.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="9822272" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="314" name="Convert_993102" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="315" name="self.model.model.decoder.layers.13.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="316" name="self.model.model.decoder.layers.13.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="9826368" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="317" name="self.model.model.decoder.layers.13.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="318" name="Constant_993107" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="319" name="Reshape_993108" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="320" name="self.model.model.decoder.layers.13.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="321" name="__module.model.model.decoder.layers.13.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1911,tensor.165"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="322" name="Constant_58066" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="323" name="__module.model.model.decoder.layers.13.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1913"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="324" name="__module.model.model.decoder.layers.13.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="325" name="__module.model.model.decoder.layers.13.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1914"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="326" name="ReadValue_61539" type="ReadValue" version="opset6"> <data variable_id="1914" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="328" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="9842752" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="329" name="Convert_997398" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="330" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="10367040" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="331" name="Convert_997401" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="332" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="333" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="10371136" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="334" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="335" name="Constant_997406" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="336" name="Reshape_997407" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="337" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="338" name="__module.model.model.decoder.layers.0.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="403,tensor.9"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="339" name="Constant_57962" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="340" name="__module.model.model.decoder.layers.0.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="405"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="341" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="342" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="406"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="343" name="ReadValue_61537" type="ReadValue" version="opset6"> <data variable_id="406" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="345" name="self.model.model.decoder.layers.5.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="10387520" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="346" name="Convert_1001697" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="347" name="self.model.model.decoder.layers.5.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="10911808" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="348" name="Convert_1001700" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="349" name="self.model.model.decoder.layers.5.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="350" name="self.model.model.decoder.layers.5.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="10915904" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="351" name="self.model.model.decoder.layers.5.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="352" name="Constant_1001705" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="353" name="Reshape_1001706" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="354" name="self.model.model.decoder.layers.5.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="355" name="__module.model.model.decoder.layers.5.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="356" name="Constant_54593" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="10932288" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="357" name="__module.model.model.decoder.layers.5.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="990,tensor.71"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="358" name="Constant_58003" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="359" name="__module.model.model.decoder.layers.5.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="992"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="360" name="__module.model.model.decoder.layers.5.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="361" name="__module.model.model.decoder.layers.5.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="993"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="362" name="ReadValue_61535" type="ReadValue" version="opset6"> <data variable_id="993" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="364" name="self.model.model.decoder.layers.12.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="10936384" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="365" name="Convert_1005996" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="366" name="self.model.model.decoder.layers.12.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="11460672" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="367" name="Convert_1005999" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="368" name="self.model.model.decoder.layers.12.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="369" name="self.model.model.decoder.layers.12.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="11464768" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="370" name="self.model.model.decoder.layers.12.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="371" name="Constant_1006004" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="372" name="Reshape_1006005" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="373" name="self.model.model.decoder.layers.12.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="374" name="__module.model.model.decoder.layers.12.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="375" name="Constant_54691" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="11481152" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="376" name="__module.model.model.decoder.layers.12.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1802,tensor.155"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="377" name="Constant_58059" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="378" name="__module.model.model.decoder.layers.12.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1804"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="379" name="__module.model.model.decoder.layers.12.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="380" name="__module.model.model.decoder.layers.12.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1805"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="381" name="ReadValue_61533" type="ReadValue" version="opset6"> <data variable_id="1805" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="383" name="self.model.model.decoder.layers.5.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="11485248" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="384" name="Convert_1010295" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="385" name="self.model.model.decoder.layers.5.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="12009536" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="386" name="Convert_1010298" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="387" name="self.model.model.decoder.layers.5.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="388" name="self.model.model.decoder.layers.5.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="12013632" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="389" name="self.model.model.decoder.layers.5.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="390" name="Constant_1010303" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="391" name="Reshape_1010304" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="392" name="self.model.model.decoder.layers.5.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="393" name="__module.model.model.decoder.layers.5.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="983,tensor.69"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="394" name="Constant_58002" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="395" name="__module.model.model.decoder.layers.5.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="985"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="396" name="__module.model.model.decoder.layers.5.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="397" name="__module.model.model.decoder.layers.5.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="986"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="398" name="ReadValue_61531" type="ReadValue" version="opset6"> <data variable_id="986" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="400" name="self.model.model.decoder.layers.12.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="12030016" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="401" name="Convert_1014594" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="402" name="self.model.model.decoder.layers.12.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="12554304" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="403" name="Convert_1014597" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="404" name="self.model.model.decoder.layers.12.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="405" name="self.model.model.decoder.layers.12.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="12558400" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="406" name="self.model.model.decoder.layers.12.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="407" name="Constant_1014602" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="408" name="Reshape_1014603" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="409" name="self.model.model.decoder.layers.12.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="410" name="__module.model.model.decoder.layers.12.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1795,tensor.153"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="411" name="Constant_58058" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="412" name="__module.model.model.decoder.layers.12.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1797"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="413" name="__module.model.model.decoder.layers.12.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="414" name="__module.model.model.decoder.layers.12.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1798"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="415" name="ReadValue_61529" type="ReadValue" version="opset6"> <data variable_id="1798" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="417" name="self.model.model.decoder.layers.4.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="12574784" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="418" name="Convert_1018893" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="419" name="self.model.model.decoder.layers.4.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="13099072" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="420" name="Convert_1018896" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="421" name="self.model.model.decoder.layers.4.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="422" name="self.model.model.decoder.layers.4.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="13103168" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="423" name="self.model.model.decoder.layers.4.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="424" name="Constant_1018901" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="425" name="Reshape_1018902" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="426" name="self.model.model.decoder.layers.4.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="427" name="__module.model.model.decoder.layers.4.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="428" name="Constant_54579" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="13119552" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="429" name="__module.model.model.decoder.layers.4.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="874,tensor.59"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="430" name="Constant_57995" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="431" name="__module.model.model.decoder.layers.4.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="876"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="432" name="__module.model.model.decoder.layers.4.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="433" name="__module.model.model.decoder.layers.4.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="877"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="434" name="ReadValue_61527" type="ReadValue" version="opset6"> <data variable_id="877" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="436" name="self.model.model.decoder.layers.22.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="13123648" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="437" name="Convert_1023192" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="438" name="self.model.model.decoder.layers.22.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="13647936" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="439" name="Convert_1023195" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="440" name="self.model.model.decoder.layers.22.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="441" name="self.model.model.decoder.layers.22.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="13652032" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="442" name="self.model.model.decoder.layers.22.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="443" name="Constant_1023200" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="444" name="Reshape_1023201" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="445" name="self.model.model.decoder.layers.22.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="446" name="__module.model.model.decoder.layers.22.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="447" name="Constant_54831" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="13668416" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="448" name="__module.model.model.decoder.layers.22.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2962,tensor.275"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="449" name="Constant_58139" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="450" name="__module.model.model.decoder.layers.22.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2964"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="451" name="__module.model.model.decoder.layers.22.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="452" name="__module.model.model.decoder.layers.22.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2965"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="453" name="ReadValue_61525" type="ReadValue" version="opset6"> <data variable_id="2965" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="455" name="self.model.model.decoder.layers.11.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="13672512" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="456" name="Convert_1027491" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="457" name="self.model.model.decoder.layers.11.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="14196800" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="458" name="Convert_1027494" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="459" name="self.model.model.decoder.layers.11.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="460" name="self.model.model.decoder.layers.11.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="14200896" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="461" name="self.model.model.decoder.layers.11.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="462" name="Constant_1027499" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="463" name="Reshape_1027500" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="464" name="self.model.model.decoder.layers.11.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="465" name="__module.model.model.decoder.layers.11.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="466" name="Constant_54677" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="14217280" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="467" name="__module.model.model.decoder.layers.11.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1686,tensor.143"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="468" name="Constant_58051" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="469" name="__module.model.model.decoder.layers.11.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1688"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="470" name="__module.model.model.decoder.layers.11.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="471" name="__module.model.model.decoder.layers.11.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1689"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="472" name="ReadValue_61523" type="ReadValue" version="opset6"> <data variable_id="1689" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="474" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="14221376" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="475" name="Convert_1031790" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="476" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="14745664" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="477" name="Convert_1031793" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="478" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="479" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="14749760" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="480" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="481" name="Constant_1031798" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="482" name="Reshape_1031799" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="483" name="self.model.model.decoder.layers.3.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="484" name="__module.model.model.decoder.layers.3.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="485" name="Constant_54565" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="14766144" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="486" name="__module.model.model.decoder.layers.3.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="758,tensor.47"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="487" name="Constant_57987" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="488" name="__module.model.model.decoder.layers.3.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="760"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="489" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="490" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="761"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="491" name="ReadValue_61521" type="ReadValue" version="opset6"> <data variable_id="761" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="493" name="self.model.model.decoder.layers.21.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="14770240" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="494" name="Convert_1036089" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="495" name="self.model.model.decoder.layers.21.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="15294528" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="496" name="Convert_1036092" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="497" name="self.model.model.decoder.layers.21.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="498" name="self.model.model.decoder.layers.21.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="15298624" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="499" name="self.model.model.decoder.layers.21.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="500" name="Constant_1036097" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="501" name="Reshape_1036098" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="502" name="self.model.model.decoder.layers.21.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="503" name="__module.model.model.decoder.layers.21.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="504" name="Constant_54817" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="15315008" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="505" name="__module.model.model.decoder.layers.21.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2846,tensor.263"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="506" name="Constant_58131" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="507" name="__module.model.model.decoder.layers.21.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2848"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="508" name="__module.model.model.decoder.layers.21.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="509" name="__module.model.model.decoder.layers.21.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2849"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="510" name="ReadValue_61519" type="ReadValue" version="opset6"> <data variable_id="2849" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="512" name="self.model.model.decoder.layers.4.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="15319104" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="513" name="Convert_1040388" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="514" name="self.model.model.decoder.layers.4.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="15843392" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="515" name="Convert_1040391" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="516" name="self.model.model.decoder.layers.4.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="517" name="self.model.model.decoder.layers.4.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="15847488" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="518" name="self.model.model.decoder.layers.4.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="519" name="Constant_1040396" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="520" name="Reshape_1040397" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="521" name="self.model.model.decoder.layers.4.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="522" name="__module.model.model.decoder.layers.4.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="867,tensor.57"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="523" name="Constant_57994" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="524" name="__module.model.model.decoder.layers.4.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="869"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="525" name="__module.model.model.decoder.layers.4.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="526" name="__module.model.model.decoder.layers.4.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="870"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="527" name="ReadValue_61517" type="ReadValue" version="opset6"> <data variable_id="870" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="529" name="self.model.model.decoder.layers.22.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="15863872" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="530" name="Convert_1044687" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="531" name="self.model.model.decoder.layers.22.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="16388160" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="532" name="Convert_1044690" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="533" name="self.model.model.decoder.layers.22.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="534" name="self.model.model.decoder.layers.22.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="16392256" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="535" name="self.model.model.decoder.layers.22.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="536" name="Constant_1044695" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="537" name="Reshape_1044696" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="538" name="self.model.model.decoder.layers.22.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="539" name="__module.model.model.decoder.layers.22.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2955,tensor.273"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="540" name="Constant_58138" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="541" name="__module.model.model.decoder.layers.22.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2957"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="542" name="__module.model.model.decoder.layers.22.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="543" name="__module.model.model.decoder.layers.22.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2958"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="544" name="ReadValue_61515" type="ReadValue" version="opset6"> <data variable_id="2958" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="546" name="self.model.model.decoder.layers.11.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="16408640" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="547" name="Convert_1048986" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="548" name="self.model.model.decoder.layers.11.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="16932928" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="549" name="Convert_1048989" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="550" name="self.model.model.decoder.layers.11.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="551" name="self.model.model.decoder.layers.11.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="16937024" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="552" name="self.model.model.decoder.layers.11.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="553" name="Constant_1048994" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="554" name="Reshape_1048995" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="555" name="self.model.model.decoder.layers.11.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="556" name="__module.model.model.decoder.layers.11.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1679,tensor.141"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="557" name="Constant_58050" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="558" name="__module.model.model.decoder.layers.11.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1681"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="559" name="__module.model.model.decoder.layers.11.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="560" name="__module.model.model.decoder.layers.11.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1682"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="561" name="ReadValue_61513" type="ReadValue" version="opset6"> <data variable_id="1682" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="563" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="16953408" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="564" name="Convert_1053285" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="565" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="17477696" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="566" name="Convert_1053288" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="567" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="568" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="17481792" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="569" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="570" name="Constant_1053293" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="571" name="Reshape_1053294" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="572" name="self.model.model.decoder.layers.2.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="573" name="__module.model.model.decoder.layers.2.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="574" name="Constant_54551" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="17498176" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="575" name="__module.model.model.decoder.layers.2.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="642,tensor.35"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="576" name="Constant_57979" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="577" name="__module.model.model.decoder.layers.2.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="644"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="578" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="579" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="645"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="580" name="ReadValue_61511" type="ReadValue" version="opset6"> <data variable_id="645" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="582" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="17502272" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="583" name="Convert_1057584" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="584" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="18026560" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="585" name="Convert_1057587" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="586" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="587" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="18030656" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="588" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="589" name="Constant_1057592" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="590" name="Reshape_1057593" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="591" name="self.model.model.decoder.layers.3.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="592" name="__module.model.model.decoder.layers.3.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="751,tensor.45"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="593" name="Constant_57986" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="594" name="__module.model.model.decoder.layers.3.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="753"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="595" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="596" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="754"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="597" name="ReadValue_61509" type="ReadValue" version="opset6"> <data variable_id="754" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="599" name="self.model.model.decoder.layers.21.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="18047040" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="600" name="Convert_1061883" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="601" name="self.model.model.decoder.layers.21.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="18571328" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="602" name="Convert_1061886" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="603" name="self.model.model.decoder.layers.21.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="604" name="self.model.model.decoder.layers.21.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="18575424" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="605" name="self.model.model.decoder.layers.21.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="606" name="Constant_1061891" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="607" name="Reshape_1061892" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="608" name="self.model.model.decoder.layers.21.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="609" name="__module.model.model.decoder.layers.21.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2839,tensor.261"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="610" name="Constant_58130" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="611" name="__module.model.model.decoder.layers.21.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2841"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="612" name="__module.model.model.decoder.layers.21.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="613" name="__module.model.model.decoder.layers.21.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2842"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="614" name="ReadValue_61507" type="ReadValue" version="opset6"> <data variable_id="2842" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="616" name="self.model.model.decoder.layers.20.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="18591808" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="617" name="Convert_1066182" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="618" name="self.model.model.decoder.layers.20.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="19116096" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="619" name="Convert_1066185" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="620" name="self.model.model.decoder.layers.20.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="621" name="self.model.model.decoder.layers.20.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="19120192" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="622" name="self.model.model.decoder.layers.20.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="623" name="Constant_1066190" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="624" name="Reshape_1066191" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="625" name="self.model.model.decoder.layers.20.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="626" name="__module.model.model.decoder.layers.20.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="627" name="Constant_54803" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="19136576" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="628" name="__module.model.model.decoder.layers.20.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2730,tensor.251"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="629" name="Constant_58123" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="630" name="__module.model.model.decoder.layers.20.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2732"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="631" name="__module.model.model.decoder.layers.20.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="632" name="__module.model.model.decoder.layers.20.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2733"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="633" name="ReadValue_61505" type="ReadValue" version="opset6"> <data variable_id="2733" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="635" name="self.model.model.decoder.layers.10.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="19140672" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="636" name="Convert_1070481" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="637" name="self.model.model.decoder.layers.10.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="19664960" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="638" name="Convert_1070484" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="639" name="self.model.model.decoder.layers.10.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="640" name="self.model.model.decoder.layers.10.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="19669056" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="641" name="self.model.model.decoder.layers.10.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="642" name="Constant_1070489" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="643" name="Reshape_1070490" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="644" name="self.model.model.decoder.layers.10.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="645" name="__module.model.model.decoder.layers.10.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="646" name="Constant_54663" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="19685440" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="647" name="__module.model.model.decoder.layers.10.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1570,tensor.131"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="648" name="Constant_58043" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="649" name="__module.model.model.decoder.layers.10.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1572"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="650" name="__module.model.model.decoder.layers.10.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="651" name="__module.model.model.decoder.layers.10.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1573"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="652" name="ReadValue_61503" type="ReadValue" version="opset6"> <data variable_id="1573" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="654" name="self.model.model.decoder.layers.19.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="19689536" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="655" name="Convert_1074780" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="656" name="self.model.model.decoder.layers.19.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="20213824" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="657" name="Convert_1074783" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="658" name="self.model.model.decoder.layers.19.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="659" name="self.model.model.decoder.layers.19.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="20217920" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="660" name="self.model.model.decoder.layers.19.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="661" name="Constant_1074788" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="662" name="Reshape_1074789" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="663" name="self.model.model.decoder.layers.19.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="664" name="__module.model.model.decoder.layers.19.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="665" name="Constant_54789" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="20234304" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="666" name="__module.model.model.decoder.layers.19.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2614,tensor.239"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="667" name="Constant_58115" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="668" name="__module.model.model.decoder.layers.19.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2616"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="669" name="__module.model.model.decoder.layers.19.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="670" name="__module.model.model.decoder.layers.19.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2617"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="671" name="ReadValue_61501" type="ReadValue" version="opset6"> <data variable_id="2617" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="673" name="self.model.model.decoder.layers.20.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="20238400" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="674" name="Convert_1079079" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="675" name="self.model.model.decoder.layers.20.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="20762688" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="676" name="Convert_1079082" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="677" name="self.model.model.decoder.layers.20.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="678" name="self.model.model.decoder.layers.20.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="20766784" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="679" name="self.model.model.decoder.layers.20.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="680" name="Constant_1079087" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="681" name="Reshape_1079088" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="682" name="self.model.model.decoder.layers.20.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="683" name="__module.model.model.decoder.layers.20.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2723,tensor.249"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="684" name="Constant_58122" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="685" name="__module.model.model.decoder.layers.20.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2725"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="686" name="__module.model.model.decoder.layers.20.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="687" name="__module.model.model.decoder.layers.20.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2726"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="688" name="ReadValue_61499" type="ReadValue" version="opset6"> <data variable_id="2726" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="690" name="self.model.model.decoder.layers.10.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="20783168" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="691" name="Convert_1083378" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="692" name="self.model.model.decoder.layers.10.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="21307456" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="693" name="Convert_1083381" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="694" name="self.model.model.decoder.layers.10.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="695" name="self.model.model.decoder.layers.10.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="21311552" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="696" name="self.model.model.decoder.layers.10.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="697" name="Constant_1083386" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="698" name="Reshape_1083387" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="699" name="self.model.model.decoder.layers.10.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="700" name="__module.model.model.decoder.layers.10.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1563,tensor.129"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="701" name="Constant_58042" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="702" name="__module.model.model.decoder.layers.10.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1565"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="703" name="__module.model.model.decoder.layers.10.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="704" name="__module.model.model.decoder.layers.10.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1566"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="705" name="ReadValue_61497" type="ReadValue" version="opset6"> <data variable_id="1566" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="707" name="self.model.model.decoder.layers.9.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="21327936" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="708" name="Convert_1087677" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="709" name="self.model.model.decoder.layers.9.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="21852224" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="710" name="Convert_1087680" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="711" name="self.model.model.decoder.layers.9.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="712" name="self.model.model.decoder.layers.9.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="21856320" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="713" name="self.model.model.decoder.layers.9.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="714" name="Constant_1087685" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="715" name="Reshape_1087686" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="716" name="self.model.model.decoder.layers.9.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="717" name="__module.model.model.decoder.layers.9.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="718" name="Constant_54649" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="21872704" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="719" name="__module.model.model.decoder.layers.9.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1454,tensor.119"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="720" name="Constant_58035" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="721" name="__module.model.model.decoder.layers.9.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1456"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="722" name="__module.model.model.decoder.layers.9.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="723" name="__module.model.model.decoder.layers.9.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1457"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="724" name="ReadValue_61495" type="ReadValue" version="opset6"> <data variable_id="1457" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="726" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="21876800" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="727" name="Convert_1091976" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="728" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="22401088" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="729" name="Convert_1091979" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="730" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="731" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="22405184" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="732" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="733" name="Constant_1091984" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="734" name="Reshape_1091985" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="735" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="736" name="__module.model.model.decoder.layers.1.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="737" name="Constant_54537" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="22421568" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="738" name="__module.model.model.decoder.layers.1.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="526,tensor.23"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="739" name="Constant_57971" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="740" name="__module.model.model.decoder.layers.1.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="528"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="741" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="742" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="529"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="743" name="ReadValue_61493" type="ReadValue" version="opset6"> <data variable_id="529" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="745" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="22425664" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="746" name="Convert_1096275" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="747" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="22949952" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="748" name="Convert_1096278" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="749" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="750" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="22954048" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="751" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="752" name="Constant_1096283" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="753" name="Reshape_1096284" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="754" name="self.model.model.decoder.layers.2.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="755" name="__module.model.model.decoder.layers.2.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="635,tensor.33"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="756" name="Constant_57978" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="757" name="__module.model.model.decoder.layers.2.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="637"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="758" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="759" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="638"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="760" name="ReadValue_61491" type="ReadValue" version="opset6"> <data variable_id="638" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="762" name="self.model.model.decoder.layers.19.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="22970432" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="763" name="Convert_1100574" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="764" name="self.model.model.decoder.layers.19.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="23494720" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="765" name="Convert_1100577" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="766" name="self.model.model.decoder.layers.19.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="767" name="self.model.model.decoder.layers.19.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="23498816" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="768" name="self.model.model.decoder.layers.19.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="769" name="Constant_1100582" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="770" name="Reshape_1100583" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="771" name="self.model.model.decoder.layers.19.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="772" name="__module.model.model.decoder.layers.19.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2607,tensor.237"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="773" name="Constant_58114" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="774" name="__module.model.model.decoder.layers.19.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2609"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="775" name="__module.model.model.decoder.layers.19.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="776" name="__module.model.model.decoder.layers.19.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2610"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="777" name="ReadValue_61489" type="ReadValue" version="opset6"> <data variable_id="2610" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="779" name="self.model.model.decoder.layers.18.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="23515200" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="780" name="Convert_1104873" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="781" name="self.model.model.decoder.layers.18.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="24039488" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="782" name="Convert_1104876" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="783" name="self.model.model.decoder.layers.18.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="784" name="self.model.model.decoder.layers.18.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="24043584" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="785" name="self.model.model.decoder.layers.18.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="786" name="Constant_1104881" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="787" name="Reshape_1104882" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="788" name="self.model.model.decoder.layers.18.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="789" name="__module.model.model.decoder.layers.18.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="790" name="Constant_54775" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="24059968" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="791" name="__module.model.model.decoder.layers.18.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2498,tensor.227"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="792" name="Constant_58107" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="793" name="__module.model.model.decoder.layers.18.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2500"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="794" name="__module.model.model.decoder.layers.18.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="795" name="__module.model.model.decoder.layers.18.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2501"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="796" name="ReadValue_61487" type="ReadValue" version="opset6"> <data variable_id="2501" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="798" name="self.model.model.decoder.layers.9.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="24064064" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="799" name="Convert_1109172" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="800" name="self.model.model.decoder.layers.9.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="24588352" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="801" name="Convert_1109175" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="802" name="self.model.model.decoder.layers.9.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="803" name="self.model.model.decoder.layers.9.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="24592448" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="804" name="self.model.model.decoder.layers.9.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="805" name="Constant_1109180" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="806" name="Reshape_1109181" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="807" name="self.model.model.decoder.layers.9.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="808" name="__module.model.model.decoder.layers.9.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1447,tensor.117"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="809" name="Constant_58034" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="810" name="__module.model.model.decoder.layers.9.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1449"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="811" name="__module.model.model.decoder.layers.9.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="812" name="__module.model.model.decoder.layers.9.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1450"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="813" name="ReadValue_61485" type="ReadValue" version="opset6"> <data variable_id="1450" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="815" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="24608832" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="816" name="Convert_1113471" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="817" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="25133120" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="818" name="Convert_1113474" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="819" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="820" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="25137216" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="821" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="822" name="Constant_1113479" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="823" name="Reshape_1113480" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="824" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="825" name="__module.model.model.decoder.layers.1.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="519,tensor.21"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="826" name="Constant_57970" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="827" name="__module.model.model.decoder.layers.1.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="521"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="828" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="829" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="522"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="830" name="ReadValue_61483" type="ReadValue" version="opset6"> <data variable_id="522" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="832" name="self.model.model.decoder.layers.17.encoder_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="25153600" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="833" name="Convert_1117770" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="834" name="self.model.model.decoder.layers.17.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="25677888" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="835" name="Convert_1117773" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="836" name="self.model.model.decoder.layers.17.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="837" name="self.model.model.decoder.layers.17.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="25681984" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="838" name="self.model.model.decoder.layers.17.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="839" name="Constant_1117778" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="840" name="Reshape_1117779" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="841" name="self.model.model.decoder.layers.17.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="842" name="__module.model.model.decoder.layers.17.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="843" name="Constant_54761" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="25698368" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="844" name="__module.model.model.decoder.layers.17.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2382,tensor.215"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="845" name="Constant_58099" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="846" name="__module.model.model.decoder.layers.17.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2384"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="847" name="__module.model.model.decoder.layers.17.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="848" name="__module.model.model.decoder.layers.17.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2385"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="849" name="ReadValue_61481" type="ReadValue" version="opset6"> <data variable_id="2385" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="851" name="self.model.model.decoder.layers.18.encoder_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="25702464" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="852" name="Convert_1122069" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="853" name="self.model.model.decoder.layers.18.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="26226752" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="854" name="Convert_1122072" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="855" name="self.model.model.decoder.layers.18.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="856" name="self.model.model.decoder.layers.18.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="26230848" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="857" name="self.model.model.decoder.layers.18.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="858" name="Constant_1122077" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="859" name="Reshape_1122078" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="860" name="self.model.model.decoder.layers.18.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="861" name="__module.model.model.decoder.layers.18.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2491,tensor.225"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="862" name="Constant_58106" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="863" name="__module.model.model.decoder.layers.18.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2493"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="864" name="__module.model.model.decoder.layers.18.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="865" name="__module.model.model.decoder.layers.18.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2494"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="866" name="ReadValue_61479" type="ReadValue" version="opset6"> <data variable_id="2494" variable_type="dynamic" variable_shape="..." /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="868" name="Constant_60433" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="869" name="ShapeOf_60419" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="870" name="Constant_60421" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="871" name="Constant_60423" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="872" name="Gather_60424" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>2</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="873" name="Constant_60426" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="874" name="Constant_60428" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="875" name="Constant_60430" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="876" name="Concat_60431" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="877" name="Broadcast_60434" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="878" name="ReadValue_60035" type="ReadValue" version="opset6"> <data variable_id="past_key_values.9.decoder.valuepresent.9.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.9.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="879" name="Constant_59473" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="880" name="Gather_59474" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="881" name="self.model.model.decoder.embed_tokens.weight" type="Const" version="opset1"> <data element_type="u8" shape="51864, 1024" offset="26247260" size="53108736" /> <output> <port id="0" precision="U8"> <dim>51864</dim> <dim>1024</dim> </port> </output> </layer> <layer id="882" name="Convert_709367" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>51864</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>51864</dim> <dim>1024</dim> </port> </output> </layer> <layer id="883" name="self.model.model.decoder.embed_tokens.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="51864, 1" offset="79355996" size="51864" /> <output> <port id="0" precision="U8"> <dim>51864</dim> <dim>1</dim> </port> </output> </layer> <layer id="884" name="Convert_709370" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>51864</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>51864</dim> <dim>1</dim> </port> </output> </layer> <layer id="885" name="self.model.model.decoder.embed_tokens.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>51864</dim> <dim>1024</dim> </port> <port id="1" precision="FP16"> <dim>51864</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>51864</dim> <dim>1024</dim> </port> </output> </layer> <layer id="886" name="self.model.model.decoder.embed_tokens.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="51864, 1" offset="79407860" size="103728" /> <output> <port id="0" precision="FP16"> <dim>51864</dim> <dim>1</dim> </port> </output> </layer> <layer id="887" name="self.model.model.decoder.embed_tokens.weight/fq_weights_0" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>51864</dim> <dim>1024</dim> </port> <port id="1" precision="FP16"> <dim>51864</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>51864</dim> <dim>1024</dim> </port> </output> </layer> <layer id="888" name="self.model.model.decoder.embed_tokens.weight/fq_weights_0/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>51864</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>51864</dim> <dim>1024</dim> </port> </output> </layer> <layer id="889" name="__module.model.model.decoder/prim::ListConstruct" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="79511588" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="890" name="__module.model.model.decoder/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="I64" names="289"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="891" name="__module.model.model.decoder.embed_tokens/aten::embedding/Convert" type="Convert" version="opset1"> <data destination_type="i32" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I32"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="892" name="__module.model.model.decoder.embed_tokens/aten::embedding/Constant" type="Const" version="opset1"> <data element_type="i32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="893" name="__module.model.model.decoder.embed_tokens/aten::embedding/Gather" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>51864</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> <dim>-1</dim> </port> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="FP32" names="291,inputs_embeds"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="894" name="self.model.model.decoder.embed_positions.weight" type="Const" version="opset1"> <data element_type="u8" shape="448, 1024" offset="79511604" size="458752" /> <output> <port id="0" precision="U8"> <dim>448</dim> <dim>1024</dim> </port> </output> </layer> <layer id="895" name="Convert_1745422" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>448</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>448</dim> <dim>1024</dim> </port> </output> </layer> <layer id="896" name="self.model.model.decoder.embed_positions.weight/zero_point" type="Const" version="opset1"> <data element_type="u8" shape="448, 1" offset="79970356" size="448" /> <output> <port id="0" precision="U8"> <dim>448</dim> <dim>1</dim> </port> </output> </layer> <layer id="897" name="Convert_1745425" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U8"> <dim>448</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>448</dim> <dim>1</dim> </port> </output> </layer> <layer id="898" name="self.model.model.decoder.embed_positions.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>448</dim> <dim>1024</dim> </port> <port id="1" precision="FP16"> <dim>448</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>448</dim> <dim>1024</dim> </port> </output> </layer> <layer id="899" name="self.model.model.decoder.embed_positions.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="448, 1" offset="79970804" size="896" /> <output> <port id="0" precision="FP16"> <dim>448</dim> <dim>1</dim> </port> </output> </layer> <layer id="900" name="self.model.model.decoder.embed_positions.weight/fq_weights_0" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>448</dim> <dim>1024</dim> </port> <port id="1" precision="FP16"> <dim>448</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>448</dim> <dim>1024</dim> </port> </output> </layer> <layer id="901" name="self.model.model.decoder.embed_positions.weight/fq_weights_0/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>448</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>448</dim> <dim>1024</dim> </port> </output> </layer> <layer id="902" name="221" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" names="221" /> </output> </layer> <layer id="903" name="__module.model.model.decoder/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I64"> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="292"> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="904" name="ShapeOf_55745" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="905" name="Constant_55746" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="906" name="Constant_55747" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="907" name="Gather_55748" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>2</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="1037,1089,1153,1205,1269,1321,1385,1437,1501,1553,1617,1669,1733,1785,1849,1901,1965,2017,2081,2133,2197,2249,2313,2365,2429,2481,2545,2597,2661,2713,2777,2829,286,2893,2945,3009,3061,309,338,393,457,509,573,625,689,741,805,857,921,973"> <dim>1</dim> </port> </output> </layer> <layer id="908" name="Constant_33718" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="79971700" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="909" name="__module.model.model.decoder/prim::ListConstruct/Concat" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64" names="293"> <dim>2</dim> </port> </output> </layer> <layer id="910" name="__module.model.model.decoder/aten::repeat/Tile" type="Tile" version="opset1"> <input> <port id="0" precision="I64"> <dim>1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="I64" names="294,position_ids"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="911" name="__module.model.model.decoder.embed_positions/aten::index/Convert" type="Convert" version="opset1"> <data destination_type="i32" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I32"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="912" name="__module.model.model.decoder.embed_positions/aten::index/Constant" type="Const" version="opset1"> <data element_type="i32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="913" name="__module.model.model.decoder.embed_positions/aten::index/Gather" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>448</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> <dim>-1</dim> </port> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="FP32" names="297,298,positions,positions.1"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="914" name="__module.model.model.decoder/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="299,input.1"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="915" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="916" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="917" name="Constant_54514" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="79971712" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="918" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="919" name="Constant_54515" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="79975808" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="920" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="333,hidden_states.1"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="921" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="79979904" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="922" name="Convert_1134966" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="923" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="80504192" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="924" name="Convert_1134969" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="925" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="926" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="80508288" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="927" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="928" name="Constant_1134974" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="929" name="Reshape_1134975" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="930" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="931" name="__module.model.model.decoder.layers.0.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="932" name="Constant_54516" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="80524672" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="933" name="__module.model.model.decoder.layers.0.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="342,tensor.1"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="934" name="Constant_57957" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="935" name="__module.model.model.decoder.layers.0.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="344"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="936" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="937" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="345"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="938" name="Constant_60445" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="939" name="Constant_60438" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="940" name="Constant_60440" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="941" name="Constant_60442" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="942" name="Concat_60443" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="943" name="Broadcast_60446" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="944" name="ReadValue_59941" type="ReadValue" version="opset6"> <data variable_id="past_key_values.0.decoder.keypresent.0.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.0.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="945" name="Constant_59416" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="946" name="Gather_59417" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="947" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="80528768" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="948" name="Convert_1130667" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="949" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="81053056" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="950" name="Convert_1130670" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="951" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="952" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="81057152" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="953" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="954" name="Constant_1130675" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="955" name="Reshape_1130676" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="956" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="957" name="__module.model.model.decoder.layers.0.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="348,tensor.3"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="958" name="Constant_57958" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="959" name="__module.model.model.decoder.layers.0.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="350"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="960" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="961" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="351"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="962" name="__module.model.model.decoder.layers.0.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.7"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="963" name="Constant_60457" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="964" name="Constant_60450" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="965" name="Constant_60452" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="966" name="Constant_60454" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="967" name="Concat_60455" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="968" name="Broadcast_60458" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="969" name="ReadValue_59943" type="ReadValue" version="opset6"> <data variable_id="past_key_values.0.decoder.valuepresent.0.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.0.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="970" name="Constant_59419" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="971" name="Gather_59420" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="972" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="81073536" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="973" name="Convert_1126368" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="974" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="81597824" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="975" name="Convert_1126371" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="976" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="977" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="81601920" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="978" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="979" name="Constant_1126376" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="980" name="Reshape_1126377" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="981" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="982" name="__module.model.model.decoder.layers.0.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="983" name="Constant_54517" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="81618304" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="984" name="__module.model.model.decoder.layers.0.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="355,tensor.5"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="985" name="Constant_57959" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="986" name="__module.model.model.decoder.layers.0.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="357"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="987" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="988" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="358"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="989" name="__module.model.model.decoder.layers.0.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="990" name="Constant_54518" type="Const" version="opset1"> <data element_type="f32" shape="1, 1" offset="81622400" size="4" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="991" name="__module.model.model.decoder/aten::arange/Constant" type="Const" version="opset1"> <data element_type="i32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="992" name="ShapeOf_55761" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="993" name="Constant_55762" type="Const" version="opset1"> <data element_type="i64" shape="" offset="81622404" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="994" name="Constant_55763" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="995" name="Gather_55764" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>4</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="301" /> </output> </layer> <layer id="996" name="Constant_55770" type="Const" version="opset1"> <data element_type="i64" shape="" offset="79971700" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="997" name="Constant_55771" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="998" name="Gather_55772" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>2</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="303" /> </output> </layer> <layer id="999" name="__module.model.model.decoder/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="305" /> </output> </layer> <layer id="1000" name="__module.model.model.decoder/aten::add/Multiply_2" type="Const" version="opset1"> <data element_type="i64" shape="" offset="79971700" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1001" name="__module.model.model.decoder/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="306,308" /> </output> </layer> <layer id="1002" name="__module.model.model.decoder/aten::arange/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="" offset="81622412" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="1003" name="__module.model.model.decoder/aten::arange/Range" type="Range" version="opset4"> <data output_type="f32" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I64" /> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> </port> </output> </layer> <layer id="1004" name="__module.model.model.decoder/aten::arange/ConvertLike" type="Convert" version="opset1"> <data destination_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64" names="312"> <dim>-1</dim> </port> </output> </layer> <layer id="1005" name="Constant_19376" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="81622416" size="16" /> <output> <port id="0" precision="I64" names="313"> <dim>2</dim> </port> </output> </layer> <layer id="1006" name="__module.model.model.decoder/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="I64"> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="I64" names="314"> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1007" name="__module.model.model.decoder/aten::gt/Greater" type="Greater" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64"> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="BOOL" names="315"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1008" name="__module.model.model.decoder/aten::mul_/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="BOOL"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1009" name="Multiply_45374" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1010" name="ShapeOf_45375" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1011" name="Constant_55775" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="79971700" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1012" name="Reshape_55776" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1013" name="Constant_19362" type="Const" version="opset1"> <data element_type="i32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="1014" name="Unsqueeze_19363" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I64" /> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1015" name="__module.model.model.decoder/prim::ListConstruct_1" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1016" name="Maximum_45376" type="Maximum" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64"> <dim>2</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1017" name="__module.model.model.decoder/aten::mul_/Multiply" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP32" names="311,causal_mask.1"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1018" name="__module.model.model.decoder/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="317"> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1019" name="222" type="Const" version="opset1"> <data element_type="i64" shape="" offset="79971700" size="8" /> <output> <port id="0" precision="I64" names="222" /> </output> </layer> <layer id="1020" name="__module.model.model.decoder/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="318,319,320"> <dim>1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1021" name="Constant_44039" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="79971700" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1022" name="Constant_44041" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="79971700" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1023" name="Constant_44043" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="79971700" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1024" name="__module.model.model.decoder/prim::ListConstruct_2" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1025" name="__module.model.model.decoder/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1064,1065,1066,1180,1181,1182,1296,1297,1298,1412,1413,1414,1528,1529,1530,1644,1645,1646,1760,1761,1762,1876,1877,1878,1992,1993,1994,2108,2109,2110,2224,2225,2226,2340,2341,2342,2456,2457,2458,2572,2573,2574,2688,2689,2690,2804,2805,2806,2920,2921,2922,3036,3037,3038,322,368,369,370,484,485,486,600,601,602,716,717,718,832,833,834,948,949,950,attention_mask"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1026" name="Constant_19659" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1027" name="Constant_55783" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="79971700" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1028" name="Reshape_55784" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1029" name="Add_55787" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64" names="1063,1179,1295,1411,1527,1643,1759,1875,1991,2107,2223,2339,2455,2571,2687,2803,2919,3035,367,483,599,715,831,947"> <dim>1</dim> </port> </output> </layer> <layer id="1030" name="Constant_19662" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="79971700" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1031" name="Constant_19657" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="81622432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1032" name="__module.model.model.decoder.layers.0.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1067,1183,1299,1415,1531,1647,1763,1879,1995,2111,2227,2343,2459,2575,2691,2807,2923,3039,371,487,603,719,835,951"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1033" name="__module.model.model.decoder.layers.0.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="372,attn_output.1"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1034" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1035" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="373,attn_output.3"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1036" name="Constant_57960" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1037" name="__module.model.model.decoder.layers.0.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="375"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1038" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="81622464" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1039" name="Convert_1139265" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1040" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="82146752" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1041" name="Convert_1139268" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1042" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1043" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="82150848" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1044" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1045" name="Constant_1139273" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1046" name="Reshape_1139274" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1047" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1048" name="__module.model.model.decoder.layers.0.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1049" name="Constant_54519" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="82167232" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1050" name="__module.model.model.decoder.layers.0.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="378,380,input.3"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1051" name="__module.model.model.decoder.layers.0/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="384,residual.3"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1052" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1053" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1054" name="Constant_54520" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="82171328" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1055" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1056" name="Constant_54521" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="82175424" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1057" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="388,hidden_states.5"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1058" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="82179520" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1059" name="Convert_1143564" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1060" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="82703808" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1061" name="Convert_1143567" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1062" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1063" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="82707904" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1064" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1065" name="Constant_1143572" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1066" name="Reshape_1143573" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1067" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1068" name="__module.model.model.decoder.layers.0.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1069" name="Constant_54522" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="82724288" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1070" name="__module.model.model.decoder.layers.0.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="397,tensor.7"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1071" name="Constant_57961" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1072" name="__module.model.model.decoder.layers.0.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="399"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1073" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1074" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="400"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1075" name="__module.model.model.decoder.layers.0.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="415,attn_output.5"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1076" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1077" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="416,attn_output.7"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1078" name="Constant_57964" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1079" name="__module.model.model.decoder.layers.0.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="418"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1080" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="82728384" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1081" name="Convert_1147863" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1082" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="83252672" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1083" name="Convert_1147866" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1084" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1085" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="83256768" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1086" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1087" name="Constant_1147871" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1088" name="Reshape_1147872" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1089" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1090" name="__module.model.model.decoder.layers.0.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1091" name="Constant_54524" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="83273152" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1092" name="__module.model.model.decoder.layers.0.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="421,input.5"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1093" name="__module.model.model.decoder.layers.0/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="423,residual.5"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1094" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1095" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1096" name="Constant_54525" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="83277248" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1097" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1098" name="Constant_54526" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="83281344" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1099" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="427"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1100" name="self.model.model.decoder.layers.0.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="83285440" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1101" name="Convert_713664" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1102" name="self.model.model.decoder.layers.0.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="85382592" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1103" name="Convert_713667" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1104" name="self.model.model.decoder.layers.0.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1105" name="self.model.model.decoder.layers.0.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="85398976" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1106" name="self.model.model.decoder.layers.0.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1107" name="Constant_713672" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1108" name="Reshape_713673" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1109" name="self.model.model.decoder.layers.0.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1110" name="__module.model.model.decoder.layers.0.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1111" name="Constant_54527" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="85464528" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1112" name="__module.model.model.decoder.layers.0.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="430"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1113" name="__module.model.model.decoder.layers.0.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="431,input.7"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1114" name="self.model.model.decoder.layers.0.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="85480912" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1115" name="Convert_717963" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1116" name="self.model.model.decoder.layers.0.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="87578064" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1117" name="Convert_717966" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1118" name="self.model.model.decoder.layers.0.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1119" name="self.model.model.decoder.layers.0.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="87594448" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1120" name="self.model.model.decoder.layers.0.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1121" name="Constant_717971" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1122" name="Reshape_717972" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1123" name="self.model.model.decoder.layers.0.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1124" name="__module.model.model.decoder.layers.0.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1125" name="Constant_54528" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="87660000" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1126" name="__module.model.model.decoder.layers.0.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="435,input.9"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1127" name="__module.model.model.decoder.layers.0/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="437,439,residual.7"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1128" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1129" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1130" name="Constant_54529" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="87664096" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1131" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1132" name="Constant_54530" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="87668192" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1133" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="452,hidden_states.11"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1134" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="87672288" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1135" name="Convert_1160760" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1136" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="88196576" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1137" name="Convert_1160763" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1138" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1139" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="88200672" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1140" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1141" name="Constant_1160768" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1142" name="Reshape_1160769" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1143" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1144" name="__module.model.model.decoder.layers.1.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1145" name="Constant_54531" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="88217056" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1146" name="__module.model.model.decoder.layers.1.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="461,tensor.13"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1147" name="Constant_57965" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1148" name="__module.model.model.decoder.layers.1.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="463"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1149" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1150" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="464"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1151" name="Constant_60481" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="1152" name="Constant_60474" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1153" name="Constant_60476" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1154" name="Constant_60478" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1155" name="Concat_60479" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1156" name="Broadcast_60482" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="1157" name="ReadValue_59945" type="ReadValue" version="opset6"> <data variable_id="past_key_values.1.decoder.keypresent.1.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.1.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1158" name="Constant_59422" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1159" name="Gather_59423" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1160" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="88221152" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1161" name="Convert_1156461" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1162" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="88745440" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1163" name="Convert_1156464" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1164" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1165" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="88749536" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1166" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1167" name="Constant_1156469" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1168" name="Reshape_1156470" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1169" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1170" name="__module.model.model.decoder.layers.1.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="467,tensor.15"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1171" name="Constant_57966" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1172" name="__module.model.model.decoder.layers.1.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="469"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1173" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1174" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="470"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1175" name="__module.model.model.decoder.layers.1.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.11"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1176" name="Constant_60469" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="1177" name="Constant_60462" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1178" name="Constant_60464" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1179" name="Constant_60466" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1180" name="Concat_60467" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1181" name="Broadcast_60470" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="1182" name="ReadValue_59947" type="ReadValue" version="opset6"> <data variable_id="past_key_values.1.decoder.valuepresent.1.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.1.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1183" name="Constant_59425" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1184" name="Gather_59426" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1185" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="88765920" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1186" name="Convert_1152162" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1187" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="89290208" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1188" name="Convert_1152165" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1189" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1190" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="89294304" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1191" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1192" name="Constant_1152170" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1193" name="Reshape_1152171" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1194" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1195" name="__module.model.model.decoder.layers.1.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1196" name="Constant_54532" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="89310688" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1197" name="__module.model.model.decoder.layers.1.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="474,tensor.17"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1198" name="Constant_57967" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1199" name="__module.model.model.decoder.layers.1.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="476"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1200" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1201" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="477"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1202" name="__module.model.model.decoder.layers.1.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1203" name="__module.model.model.decoder.layers.1.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="488,attn_output.9"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1204" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1205" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="489,attn_output.11"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1206" name="Constant_57968" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1207" name="__module.model.model.decoder.layers.1.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="491"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1208" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="89314784" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1209" name="Convert_1165059" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1210" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="89839072" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1211" name="Convert_1165062" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1212" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1213" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="89843168" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1214" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1215" name="Constant_1165067" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1216" name="Reshape_1165068" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1217" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1218" name="__module.model.model.decoder.layers.1.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1219" name="Constant_54533" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="89859552" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1220" name="__module.model.model.decoder.layers.1.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="494,496,input.11"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1221" name="__module.model.model.decoder.layers.1/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="500,residual.9"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1222" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1223" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1224" name="Constant_54534" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="89863648" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1225" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1226" name="Constant_54535" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="89867744" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1227" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="504,hidden_states.15"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1228" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="89871840" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1229" name="Convert_1169358" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1230" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="90396128" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1231" name="Convert_1169361" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1232" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1233" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="90400224" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1234" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1235" name="Constant_1169366" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1236" name="Reshape_1169367" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1237" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1238" name="__module.model.model.decoder.layers.1.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1239" name="Constant_54536" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="90416608" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1240" name="__module.model.model.decoder.layers.1.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="513,tensor.19"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1241" name="Constant_57969" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1242" name="__module.model.model.decoder.layers.1.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="515"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1243" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1244" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="516"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1245" name="__module.model.model.decoder.layers.1.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="531,attn_output.13"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1246" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1247" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="532,attn_output.15"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1248" name="Constant_57972" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1249" name="__module.model.model.decoder.layers.1.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="534"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1250" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="90420704" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1251" name="Convert_1173657" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1252" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="90944992" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1253" name="Convert_1173660" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1254" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1255" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="90949088" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1256" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1257" name="Constant_1173665" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1258" name="Reshape_1173666" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1259" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1260" name="__module.model.model.decoder.layers.1.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1261" name="Constant_54538" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="90965472" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1262" name="__module.model.model.decoder.layers.1.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="537,input.13"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1263" name="__module.model.model.decoder.layers.1/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="539,residual.11"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1264" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1265" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1266" name="Constant_54539" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="90969568" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1267" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1268" name="Constant_54540" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="90973664" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1269" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="543"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1270" name="self.model.model.decoder.layers.1.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="90977760" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1271" name="Convert_722262" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1272" name="self.model.model.decoder.layers.1.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="93074912" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1273" name="Convert_722265" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1274" name="self.model.model.decoder.layers.1.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1275" name="self.model.model.decoder.layers.1.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="93091296" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1276" name="self.model.model.decoder.layers.1.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1277" name="Constant_722270" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1278" name="Reshape_722271" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1279" name="self.model.model.decoder.layers.1.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1280" name="__module.model.model.decoder.layers.1.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1281" name="Constant_54541" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="93156832" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1282" name="__module.model.model.decoder.layers.1.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="546"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1283" name="__module.model.model.decoder.layers.1.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="547,input.15"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1284" name="self.model.model.decoder.layers.1.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="93173216" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1285" name="Convert_726561" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1286" name="self.model.model.decoder.layers.1.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="95270368" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1287" name="Convert_726564" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1288" name="self.model.model.decoder.layers.1.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1289" name="self.model.model.decoder.layers.1.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="95286752" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1290" name="self.model.model.decoder.layers.1.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1291" name="Constant_726569" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1292" name="Reshape_726570" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1293" name="self.model.model.decoder.layers.1.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1294" name="__module.model.model.decoder.layers.1.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1295" name="Constant_54542" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="95352288" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1296" name="__module.model.model.decoder.layers.1.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="551,input.17"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1297" name="__module.model.model.decoder.layers.1/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="553,555,residual.13"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1298" name="__module.model.model.decoder.layers.2.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1299" name="__module.model.model.decoder.layers.2.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1300" name="Constant_54543" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="95356384" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1301" name="__module.model.model.decoder.layers.2.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1302" name="Constant_54544" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="95360480" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1303" name="__module.model.model.decoder.layers.2.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="568,hidden_states.21"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1304" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="95364576" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1305" name="Convert_1186554" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1306" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="95888864" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1307" name="Convert_1186557" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1308" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1309" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="95892960" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1310" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1311" name="Constant_1186562" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1312" name="Reshape_1186563" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1313" name="self.model.model.decoder.layers.2.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1314" name="__module.model.model.decoder.layers.2.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1315" name="Constant_54545" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="95909344" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1316" name="__module.model.model.decoder.layers.2.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="577,tensor.25"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1317" name="Constant_57973" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1318" name="__module.model.model.decoder.layers.2.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="579"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1319" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1320" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="580"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1321" name="Constant_60505" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="1322" name="Constant_60498" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1323" name="Constant_60500" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1324" name="Constant_60502" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1325" name="Concat_60503" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1326" name="Broadcast_60506" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="1327" name="ReadValue_59989" type="ReadValue" version="opset6"> <data variable_id="past_key_values.2.decoder.keypresent.2.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.2.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1328" name="Constant_59428" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1329" name="Gather_59429" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1330" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="95913440" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1331" name="Convert_1182255" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1332" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="96437728" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1333" name="Convert_1182258" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1334" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1335" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="96441824" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1336" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1337" name="Constant_1182263" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1338" name="Reshape_1182264" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1339" name="self.model.model.decoder.layers.2.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1340" name="__module.model.model.decoder.layers.2.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="583,tensor.27"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1341" name="Constant_57974" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1342" name="__module.model.model.decoder.layers.2.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="585"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1343" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1344" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="586"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1345" name="__module.model.model.decoder.layers.2.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.13"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1346" name="Constant_60493" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="1347" name="Constant_60486" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1348" name="Constant_60488" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1349" name="Constant_60490" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1350" name="Concat_60491" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1351" name="Broadcast_60494" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="1352" name="ReadValue_59991" type="ReadValue" version="opset6"> <data variable_id="past_key_values.2.decoder.valuepresent.2.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.2.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1353" name="Constant_59431" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1354" name="Gather_59432" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1355" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="96458208" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1356" name="Convert_1177956" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1357" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="96982496" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1358" name="Convert_1177959" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1359" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1360" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="96986592" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1361" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1362" name="Constant_1177964" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1363" name="Reshape_1177965" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1364" name="self.model.model.decoder.layers.2.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1365" name="__module.model.model.decoder.layers.2.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1366" name="Constant_54546" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="97002976" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1367" name="__module.model.model.decoder.layers.2.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="590,tensor.29"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1368" name="Constant_57975" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1369" name="__module.model.model.decoder.layers.2.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="592"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1370" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1371" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="593"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1372" name="__module.model.model.decoder.layers.2.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1373" name="__module.model.model.decoder.layers.2.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="604,attn_output.17"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1374" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1375" name="__module.model.model.decoder.layers.2.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="605,attn_output.19"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1376" name="Constant_57976" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1377" name="__module.model.model.decoder.layers.2.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="607"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1378" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="97007072" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1379" name="Convert_1190853" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1380" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="97531360" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1381" name="Convert_1190856" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1382" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1383" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="97535456" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1384" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1385" name="Constant_1190861" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1386" name="Reshape_1190862" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1387" name="self.model.model.decoder.layers.2.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1388" name="__module.model.model.decoder.layers.2.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1389" name="Constant_54547" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="97551840" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1390" name="__module.model.model.decoder.layers.2.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="610,612,input.19"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1391" name="__module.model.model.decoder.layers.2/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="616,residual.15"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1392" name="__module.model.model.decoder.layers.2.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1393" name="__module.model.model.decoder.layers.2.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1394" name="Constant_54548" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="97555936" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1395" name="__module.model.model.decoder.layers.2.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1396" name="Constant_54549" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="97560032" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1397" name="__module.model.model.decoder.layers.2.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="620,hidden_states.25"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1398" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="97564128" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1399" name="Convert_1195152" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1400" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="98088416" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1401" name="Convert_1195155" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1402" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1403" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="98092512" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1404" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1405" name="Constant_1195160" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1406" name="Reshape_1195161" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1407" name="self.model.model.decoder.layers.2.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1408" name="__module.model.model.decoder.layers.2.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1409" name="Constant_54550" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="98108896" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1410" name="__module.model.model.decoder.layers.2.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="629,tensor.31"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1411" name="Constant_57977" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1412" name="__module.model.model.decoder.layers.2.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="631"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1413" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1414" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="632"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1415" name="__module.model.model.decoder.layers.2.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="647,attn_output.21"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1416" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1417" name="__module.model.model.decoder.layers.2.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="648,attn_output.23"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1418" name="Constant_57980" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1419" name="__module.model.model.decoder.layers.2.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="650"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1420" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="98112992" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1421" name="Convert_1199451" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1422" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="98637280" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1423" name="Convert_1199454" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1424" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1425" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="98641376" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1426" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1427" name="Constant_1199459" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1428" name="Reshape_1199460" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1429" name="self.model.model.decoder.layers.2.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1430" name="__module.model.model.decoder.layers.2.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1431" name="Constant_54552" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="98657760" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1432" name="__module.model.model.decoder.layers.2.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="653,input.21"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1433" name="__module.model.model.decoder.layers.2/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="655,residual.17"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1434" name="__module.model.model.decoder.layers.2.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1435" name="__module.model.model.decoder.layers.2.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1436" name="Constant_54553" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="98661856" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1437" name="__module.model.model.decoder.layers.2.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1438" name="Constant_54554" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="98665952" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1439" name="__module.model.model.decoder.layers.2.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="659"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1440" name="self.model.model.decoder.layers.2.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="98670048" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1441" name="Convert_730860" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1442" name="self.model.model.decoder.layers.2.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="100767200" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1443" name="Convert_730863" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1444" name="self.model.model.decoder.layers.2.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1445" name="self.model.model.decoder.layers.2.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="100783584" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1446" name="self.model.model.decoder.layers.2.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1447" name="Constant_730868" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1448" name="Reshape_730869" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1449" name="self.model.model.decoder.layers.2.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1450" name="__module.model.model.decoder.layers.2.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1451" name="Constant_54555" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="100849120" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1452" name="__module.model.model.decoder.layers.2.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="662"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1453" name="__module.model.model.decoder.layers.2.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="663,input.23"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1454" name="self.model.model.decoder.layers.2.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="100865504" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1455" name="Convert_735159" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1456" name="self.model.model.decoder.layers.2.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="102962656" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1457" name="Convert_735162" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1458" name="self.model.model.decoder.layers.2.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1459" name="self.model.model.decoder.layers.2.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="102979040" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1460" name="self.model.model.decoder.layers.2.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1461" name="Constant_735167" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1462" name="Reshape_735168" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1463" name="self.model.model.decoder.layers.2.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1464" name="__module.model.model.decoder.layers.2.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1465" name="Constant_54556" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="103044576" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1466" name="__module.model.model.decoder.layers.2.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="667,input.25"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1467" name="__module.model.model.decoder.layers.2/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="669,671,residual.19"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1468" name="__module.model.model.decoder.layers.3.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1469" name="__module.model.model.decoder.layers.3.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1470" name="Constant_54557" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="103048672" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1471" name="__module.model.model.decoder.layers.3.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1472" name="Constant_54558" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="103052768" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1473" name="__module.model.model.decoder.layers.3.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="684,hidden_states.31"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1474" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="103056864" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1475" name="Convert_1212348" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1476" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="103581152" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1477" name="Convert_1212351" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1478" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1479" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="103585248" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1480" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1481" name="Constant_1212356" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1482" name="Reshape_1212357" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1483" name="self.model.model.decoder.layers.3.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1484" name="__module.model.model.decoder.layers.3.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1485" name="Constant_54559" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="103601632" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1486" name="__module.model.model.decoder.layers.3.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="693,tensor.37"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1487" name="Constant_57981" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1488" name="__module.model.model.decoder.layers.3.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="695"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1489" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1490" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="696"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1491" name="Constant_60529" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="1492" name="Constant_60522" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1493" name="Constant_60524" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1494" name="Constant_60526" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1495" name="Concat_60527" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1496" name="Broadcast_60530" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="1497" name="ReadValue_60009" type="ReadValue" version="opset6"> <data variable_id="past_key_values.3.decoder.keypresent.3.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.3.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1498" name="Constant_59434" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1499" name="Gather_59435" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1500" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="103605728" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1501" name="Convert_1208049" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1502" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="104130016" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1503" name="Convert_1208052" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1504" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1505" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="104134112" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1506" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1507" name="Constant_1208057" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1508" name="Reshape_1208058" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1509" name="self.model.model.decoder.layers.3.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1510" name="__module.model.model.decoder.layers.3.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="699,tensor.39"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1511" name="Constant_57982" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1512" name="__module.model.model.decoder.layers.3.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="701"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1513" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1514" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="702"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1515" name="__module.model.model.decoder.layers.3.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.15"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1516" name="Constant_60517" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="1517" name="Constant_60510" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1518" name="Constant_60512" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1519" name="Constant_60514" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1520" name="Concat_60515" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1521" name="Broadcast_60518" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="1522" name="ReadValue_60011" type="ReadValue" version="opset6"> <data variable_id="past_key_values.3.decoder.valuepresent.3.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.3.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1523" name="Constant_59437" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1524" name="Gather_59438" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1525" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="104150496" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1526" name="Convert_1203750" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1527" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="104674784" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1528" name="Convert_1203753" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1529" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1530" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="104678880" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1531" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1532" name="Constant_1203758" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1533" name="Reshape_1203759" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1534" name="self.model.model.decoder.layers.3.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1535" name="__module.model.model.decoder.layers.3.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1536" name="Constant_54560" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="104695264" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1537" name="__module.model.model.decoder.layers.3.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="706,tensor.41"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1538" name="Constant_57983" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1539" name="__module.model.model.decoder.layers.3.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="708"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1540" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1541" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="709"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1542" name="__module.model.model.decoder.layers.3.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1543" name="__module.model.model.decoder.layers.3.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="720,attn_output.25"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1544" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1545" name="__module.model.model.decoder.layers.3.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="721,attn_output.27"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1546" name="Constant_57984" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1547" name="__module.model.model.decoder.layers.3.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="723"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1548" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="104699360" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1549" name="Convert_1216647" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1550" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="105223648" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1551" name="Convert_1216650" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1552" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1553" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="105227744" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1554" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1555" name="Constant_1216655" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1556" name="Reshape_1216656" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1557" name="self.model.model.decoder.layers.3.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1558" name="__module.model.model.decoder.layers.3.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1559" name="Constant_54561" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="105244128" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1560" name="__module.model.model.decoder.layers.3.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="726,728,input.27"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1561" name="__module.model.model.decoder.layers.3/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="732,residual.21"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1562" name="__module.model.model.decoder.layers.3.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1563" name="__module.model.model.decoder.layers.3.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1564" name="Constant_54562" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="105248224" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1565" name="__module.model.model.decoder.layers.3.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1566" name="Constant_54563" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="105252320" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1567" name="__module.model.model.decoder.layers.3.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="736,hidden_states.35"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1568" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="105256416" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1569" name="Convert_1220946" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1570" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="105780704" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1571" name="Convert_1220949" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1572" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1573" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="105784800" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1574" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1575" name="Constant_1220954" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1576" name="Reshape_1220955" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1577" name="self.model.model.decoder.layers.3.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1578" name="__module.model.model.decoder.layers.3.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1579" name="Constant_54564" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="105801184" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1580" name="__module.model.model.decoder.layers.3.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="745,tensor.43"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1581" name="Constant_57985" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1582" name="__module.model.model.decoder.layers.3.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="747"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1583" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1584" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="748"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1585" name="__module.model.model.decoder.layers.3.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="763,attn_output.29"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1586" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1587" name="__module.model.model.decoder.layers.3.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="764,attn_output.31"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1588" name="Constant_57988" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1589" name="__module.model.model.decoder.layers.3.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="766"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1590" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="105805280" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1591" name="Convert_1225245" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1592" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="106329568" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1593" name="Convert_1225248" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1594" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1595" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="106333664" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1596" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1597" name="Constant_1225253" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1598" name="Reshape_1225254" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1599" name="self.model.model.decoder.layers.3.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1600" name="__module.model.model.decoder.layers.3.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1601" name="Constant_54566" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="106350048" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1602" name="__module.model.model.decoder.layers.3.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="769,input.29"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1603" name="__module.model.model.decoder.layers.3/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="771,residual.23"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1604" name="__module.model.model.decoder.layers.3.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1605" name="__module.model.model.decoder.layers.3.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1606" name="Constant_54567" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="106354144" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1607" name="__module.model.model.decoder.layers.3.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1608" name="Constant_54568" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="106358240" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1609" name="__module.model.model.decoder.layers.3.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="775"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1610" name="self.model.model.decoder.layers.3.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="106362336" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1611" name="Convert_739458" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1612" name="self.model.model.decoder.layers.3.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="108459488" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1613" name="Convert_739461" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1614" name="self.model.model.decoder.layers.3.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1615" name="self.model.model.decoder.layers.3.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="108475872" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1616" name="self.model.model.decoder.layers.3.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1617" name="Constant_739466" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1618" name="Reshape_739467" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1619" name="self.model.model.decoder.layers.3.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1620" name="__module.model.model.decoder.layers.3.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1621" name="Constant_54569" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="108541408" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1622" name="__module.model.model.decoder.layers.3.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="778"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1623" name="__module.model.model.decoder.layers.3.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="779,input.31"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1624" name="self.model.model.decoder.layers.3.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="108557792" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1625" name="Convert_743757" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1626" name="self.model.model.decoder.layers.3.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="110654944" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1627" name="Convert_743760" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1628" name="self.model.model.decoder.layers.3.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1629" name="self.model.model.decoder.layers.3.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="110671328" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1630" name="self.model.model.decoder.layers.3.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1631" name="Constant_743765" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1632" name="Reshape_743766" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1633" name="self.model.model.decoder.layers.3.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1634" name="__module.model.model.decoder.layers.3.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1635" name="Constant_54570" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="110736864" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1636" name="__module.model.model.decoder.layers.3.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="783,input.33"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1637" name="__module.model.model.decoder.layers.3/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="785,787,residual.25"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1638" name="__module.model.model.decoder.layers.4.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1639" name="__module.model.model.decoder.layers.4.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1640" name="Constant_54571" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="110740960" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1641" name="__module.model.model.decoder.layers.4.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1642" name="Constant_54572" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="110745056" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1643" name="__module.model.model.decoder.layers.4.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="800,hidden_states.41"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1644" name="self.model.model.decoder.layers.4.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="110749152" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1645" name="Convert_1238142" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1646" name="self.model.model.decoder.layers.4.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="111273440" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1647" name="Convert_1238145" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1648" name="self.model.model.decoder.layers.4.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1649" name="self.model.model.decoder.layers.4.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="111277536" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1650" name="self.model.model.decoder.layers.4.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1651" name="Constant_1238150" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1652" name="Reshape_1238151" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1653" name="self.model.model.decoder.layers.4.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1654" name="__module.model.model.decoder.layers.4.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1655" name="Constant_54573" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="111293920" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1656" name="__module.model.model.decoder.layers.4.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="809,tensor.49"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1657" name="Constant_57989" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1658" name="__module.model.model.decoder.layers.4.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="811"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1659" name="__module.model.model.decoder.layers.4.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1660" name="__module.model.model.decoder.layers.4.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="812"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1661" name="Constant_60553" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="1662" name="Constant_60546" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1663" name="Constant_60548" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1664" name="Constant_60550" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1665" name="Concat_60551" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1666" name="Broadcast_60554" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="1667" name="ReadValue_60013" type="ReadValue" version="opset6"> <data variable_id="past_key_values.4.decoder.keypresent.4.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.4.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1668" name="Constant_59440" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1669" name="Gather_59441" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1670" name="self.model.model.decoder.layers.4.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="111298016" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1671" name="Convert_1233843" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1672" name="self.model.model.decoder.layers.4.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="111822304" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1673" name="Convert_1233846" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1674" name="self.model.model.decoder.layers.4.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1675" name="self.model.model.decoder.layers.4.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="111826400" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1676" name="self.model.model.decoder.layers.4.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1677" name="Constant_1233851" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1678" name="Reshape_1233852" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1679" name="self.model.model.decoder.layers.4.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1680" name="__module.model.model.decoder.layers.4.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="815,tensor.51"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1681" name="Constant_57990" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1682" name="__module.model.model.decoder.layers.4.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="817"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1683" name="__module.model.model.decoder.layers.4.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1684" name="__module.model.model.decoder.layers.4.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="818"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1685" name="__module.model.model.decoder.layers.4.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.17"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1686" name="Constant_60541" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="1687" name="Constant_60534" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1688" name="Constant_60536" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1689" name="Constant_60538" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1690" name="Concat_60539" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1691" name="Broadcast_60542" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="1692" name="ReadValue_60015" type="ReadValue" version="opset6"> <data variable_id="past_key_values.4.decoder.valuepresent.4.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.4.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1693" name="Constant_59443" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1694" name="Gather_59444" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1695" name="self.model.model.decoder.layers.4.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="111842784" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1696" name="Convert_1229544" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1697" name="self.model.model.decoder.layers.4.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="112367072" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1698" name="Convert_1229547" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1699" name="self.model.model.decoder.layers.4.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1700" name="self.model.model.decoder.layers.4.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="112371168" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1701" name="self.model.model.decoder.layers.4.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1702" name="Constant_1229552" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1703" name="Reshape_1229553" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1704" name="self.model.model.decoder.layers.4.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1705" name="__module.model.model.decoder.layers.4.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1706" name="Constant_54574" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="112387552" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1707" name="__module.model.model.decoder.layers.4.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="822,tensor.53"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1708" name="Constant_57991" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1709" name="__module.model.model.decoder.layers.4.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="824"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1710" name="__module.model.model.decoder.layers.4.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1711" name="__module.model.model.decoder.layers.4.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="825"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1712" name="__module.model.model.decoder.layers.4.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1713" name="__module.model.model.decoder.layers.4.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="836,attn_output.33"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1714" name="__module.model.model.decoder.layers.4.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1715" name="__module.model.model.decoder.layers.4.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="837,attn_output.35"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1716" name="Constant_57992" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1717" name="__module.model.model.decoder.layers.4.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="839"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1718" name="self.model.model.decoder.layers.4.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="112391648" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1719" name="Convert_1242441" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1720" name="self.model.model.decoder.layers.4.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="112915936" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1721" name="Convert_1242444" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1722" name="self.model.model.decoder.layers.4.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1723" name="self.model.model.decoder.layers.4.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="112920032" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1724" name="self.model.model.decoder.layers.4.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1725" name="Constant_1242449" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1726" name="Reshape_1242450" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1727" name="self.model.model.decoder.layers.4.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1728" name="__module.model.model.decoder.layers.4.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1729" name="Constant_54575" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="112936416" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1730" name="__module.model.model.decoder.layers.4.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="842,844,input.35"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1731" name="__module.model.model.decoder.layers.4/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="848,residual.27"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1732" name="__module.model.model.decoder.layers.4.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1733" name="__module.model.model.decoder.layers.4.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1734" name="Constant_54576" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="112940512" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1735" name="__module.model.model.decoder.layers.4.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1736" name="Constant_54577" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="112944608" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1737" name="__module.model.model.decoder.layers.4.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="852,hidden_states.45"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1738" name="self.model.model.decoder.layers.4.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="112948704" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1739" name="Convert_1246740" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1740" name="self.model.model.decoder.layers.4.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="113472992" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1741" name="Convert_1246743" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1742" name="self.model.model.decoder.layers.4.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1743" name="self.model.model.decoder.layers.4.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="113477088" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1744" name="self.model.model.decoder.layers.4.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1745" name="Constant_1246748" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1746" name="Reshape_1246749" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1747" name="self.model.model.decoder.layers.4.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1748" name="__module.model.model.decoder.layers.4.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1749" name="Constant_54578" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="113493472" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1750" name="__module.model.model.decoder.layers.4.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="861,tensor.55"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1751" name="Constant_57993" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1752" name="__module.model.model.decoder.layers.4.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="863"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1753" name="__module.model.model.decoder.layers.4.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1754" name="__module.model.model.decoder.layers.4.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="864"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1755" name="__module.model.model.decoder.layers.4.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="879,attn_output.37"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1756" name="__module.model.model.decoder.layers.4.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1757" name="__module.model.model.decoder.layers.4.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="880,attn_output.39"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1758" name="Constant_57996" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1759" name="__module.model.model.decoder.layers.4.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="882"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1760" name="self.model.model.decoder.layers.4.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="113497568" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1761" name="Convert_1251039" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1762" name="self.model.model.decoder.layers.4.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="114021856" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1763" name="Convert_1251042" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1764" name="self.model.model.decoder.layers.4.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1765" name="self.model.model.decoder.layers.4.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="114025952" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1766" name="self.model.model.decoder.layers.4.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1767" name="Constant_1251047" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1768" name="Reshape_1251048" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1769" name="self.model.model.decoder.layers.4.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1770" name="__module.model.model.decoder.layers.4.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1771" name="Constant_54580" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="114042336" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1772" name="__module.model.model.decoder.layers.4.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="885,input.37"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1773" name="__module.model.model.decoder.layers.4/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="887,residual.29"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1774" name="__module.model.model.decoder.layers.4.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1775" name="__module.model.model.decoder.layers.4.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1776" name="Constant_54581" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="114046432" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1777" name="__module.model.model.decoder.layers.4.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1778" name="Constant_54582" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="114050528" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1779" name="__module.model.model.decoder.layers.4.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="891"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1780" name="self.model.model.decoder.layers.4.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="114054624" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1781" name="Convert_748056" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1782" name="self.model.model.decoder.layers.4.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="116151776" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1783" name="Convert_748059" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1784" name="self.model.model.decoder.layers.4.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1785" name="self.model.model.decoder.layers.4.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="116168160" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1786" name="self.model.model.decoder.layers.4.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1787" name="Constant_748064" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1788" name="Reshape_748065" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1789" name="self.model.model.decoder.layers.4.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1790" name="__module.model.model.decoder.layers.4.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1791" name="Constant_54583" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="116233696" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1792" name="__module.model.model.decoder.layers.4.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="894"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1793" name="__module.model.model.decoder.layers.4.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="895,input.39"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1794" name="self.model.model.decoder.layers.4.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="116250080" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1795" name="Convert_752355" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1796" name="self.model.model.decoder.layers.4.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="118347232" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1797" name="Convert_752358" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1798" name="self.model.model.decoder.layers.4.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1799" name="self.model.model.decoder.layers.4.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="118363616" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1800" name="self.model.model.decoder.layers.4.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1801" name="Constant_752363" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1802" name="Reshape_752364" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1803" name="self.model.model.decoder.layers.4.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1804" name="__module.model.model.decoder.layers.4.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1805" name="Constant_54584" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="118429152" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1806" name="__module.model.model.decoder.layers.4.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="899,input.41"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1807" name="__module.model.model.decoder.layers.4/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="901,903,residual.31"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1808" name="__module.model.model.decoder.layers.5.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1809" name="__module.model.model.decoder.layers.5.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1810" name="Constant_54585" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="118433248" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1811" name="__module.model.model.decoder.layers.5.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1812" name="Constant_54586" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="118437344" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1813" name="__module.model.model.decoder.layers.5.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="916,hidden_states.51"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1814" name="self.model.model.decoder.layers.5.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="118441440" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1815" name="Convert_1263936" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1816" name="self.model.model.decoder.layers.5.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="118965728" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1817" name="Convert_1263939" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1818" name="self.model.model.decoder.layers.5.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1819" name="self.model.model.decoder.layers.5.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="118969824" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1820" name="self.model.model.decoder.layers.5.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1821" name="Constant_1263944" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1822" name="Reshape_1263945" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1823" name="self.model.model.decoder.layers.5.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1824" name="__module.model.model.decoder.layers.5.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1825" name="Constant_54587" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="118986208" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1826" name="__module.model.model.decoder.layers.5.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="925,tensor.61"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1827" name="Constant_57997" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1828" name="__module.model.model.decoder.layers.5.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="927"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1829" name="__module.model.model.decoder.layers.5.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1830" name="__module.model.model.decoder.layers.5.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="928"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1831" name="Constant_60577" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="1832" name="Constant_60570" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1833" name="Constant_60572" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1834" name="Constant_60574" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1835" name="Concat_60575" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1836" name="Broadcast_60578" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="1837" name="ReadValue_60017" type="ReadValue" version="opset6"> <data variable_id="past_key_values.5.decoder.keypresent.5.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.5.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1838" name="Constant_59446" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1839" name="Gather_59447" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1840" name="self.model.model.decoder.layers.5.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="118990304" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1841" name="Convert_1259637" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1842" name="self.model.model.decoder.layers.5.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="119514592" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1843" name="Convert_1259640" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1844" name="self.model.model.decoder.layers.5.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1845" name="self.model.model.decoder.layers.5.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="119518688" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1846" name="self.model.model.decoder.layers.5.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1847" name="Constant_1259645" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1848" name="Reshape_1259646" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1849" name="self.model.model.decoder.layers.5.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1850" name="__module.model.model.decoder.layers.5.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="931,tensor.63"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1851" name="Constant_57998" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1852" name="__module.model.model.decoder.layers.5.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="933"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1853" name="__module.model.model.decoder.layers.5.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1854" name="__module.model.model.decoder.layers.5.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="934"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1855" name="__module.model.model.decoder.layers.5.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.19"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1856" name="Constant_60565" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="1857" name="Constant_60558" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1858" name="Constant_60560" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1859" name="Constant_60562" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1860" name="Concat_60563" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1861" name="Broadcast_60566" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="1862" name="ReadValue_60019" type="ReadValue" version="opset6"> <data variable_id="past_key_values.5.decoder.valuepresent.5.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.5.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1863" name="Constant_59449" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1864" name="Gather_59450" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1865" name="self.model.model.decoder.layers.5.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="119535072" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1866" name="Convert_1255338" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1867" name="self.model.model.decoder.layers.5.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="120059360" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1868" name="Convert_1255341" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1869" name="self.model.model.decoder.layers.5.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1870" name="self.model.model.decoder.layers.5.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="120063456" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1871" name="self.model.model.decoder.layers.5.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1872" name="Constant_1255346" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1873" name="Reshape_1255347" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1874" name="self.model.model.decoder.layers.5.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1875" name="__module.model.model.decoder.layers.5.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1876" name="Constant_54588" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="120079840" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1877" name="__module.model.model.decoder.layers.5.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="938,tensor.65"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1878" name="Constant_57999" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1879" name="__module.model.model.decoder.layers.5.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="940"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1880" name="__module.model.model.decoder.layers.5.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1881" name="__module.model.model.decoder.layers.5.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="941"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1882" name="__module.model.model.decoder.layers.5.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1883" name="__module.model.model.decoder.layers.5.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="952,attn_output.41"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1884" name="__module.model.model.decoder.layers.5.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1885" name="__module.model.model.decoder.layers.5.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="953,attn_output.43"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1886" name="Constant_58000" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1887" name="__module.model.model.decoder.layers.5.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="955"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1888" name="self.model.model.decoder.layers.5.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="120083936" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1889" name="Convert_1268235" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1890" name="self.model.model.decoder.layers.5.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="120608224" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1891" name="Convert_1268238" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1892" name="self.model.model.decoder.layers.5.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1893" name="self.model.model.decoder.layers.5.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="120612320" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1894" name="self.model.model.decoder.layers.5.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1895" name="Constant_1268243" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1896" name="Reshape_1268244" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1897" name="self.model.model.decoder.layers.5.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1898" name="__module.model.model.decoder.layers.5.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1899" name="Constant_54589" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="120628704" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1900" name="__module.model.model.decoder.layers.5.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="958,960,input.43"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1901" name="__module.model.model.decoder.layers.5/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="964,residual.33"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1902" name="__module.model.model.decoder.layers.5.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1903" name="__module.model.model.decoder.layers.5.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1904" name="Constant_54590" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="120632800" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1905" name="__module.model.model.decoder.layers.5.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1906" name="Constant_54591" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="120636896" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1907" name="__module.model.model.decoder.layers.5.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="968,hidden_states.55"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1908" name="self.model.model.decoder.layers.5.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="120640992" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1909" name="Convert_1272534" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1910" name="self.model.model.decoder.layers.5.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="121165280" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1911" name="Convert_1272537" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1912" name="self.model.model.decoder.layers.5.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1913" name="self.model.model.decoder.layers.5.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="121169376" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1914" name="self.model.model.decoder.layers.5.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1915" name="Constant_1272542" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1916" name="Reshape_1272543" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1917" name="self.model.model.decoder.layers.5.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1918" name="__module.model.model.decoder.layers.5.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1919" name="Constant_54592" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="121185760" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1920" name="__module.model.model.decoder.layers.5.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="977,tensor.67"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1921" name="Constant_58001" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1922" name="__module.model.model.decoder.layers.5.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="979"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1923" name="__module.model.model.decoder.layers.5.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1924" name="__module.model.model.decoder.layers.5.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="980"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1925" name="__module.model.model.decoder.layers.5.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="995,attn_output.45"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="1926" name="__module.model.model.decoder.layers.5.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1927" name="__module.model.model.decoder.layers.5.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="996,attn_output.47"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1928" name="Constant_58004" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1929" name="__module.model.model.decoder.layers.5.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="998"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1930" name="self.model.model.decoder.layers.5.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="121189856" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1931" name="Convert_1276833" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1932" name="self.model.model.decoder.layers.5.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="121714144" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1933" name="Convert_1276836" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1934" name="self.model.model.decoder.layers.5.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1935" name="self.model.model.decoder.layers.5.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="121718240" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1936" name="self.model.model.decoder.layers.5.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1937" name="Constant_1276841" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1938" name="Reshape_1276842" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1939" name="self.model.model.decoder.layers.5.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1940" name="__module.model.model.decoder.layers.5.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1941" name="Constant_54594" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="121734624" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1942" name="__module.model.model.decoder.layers.5.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1001,input.45"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1943" name="__module.model.model.decoder.layers.5/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1003,residual.35"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1944" name="__module.model.model.decoder.layers.5.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1945" name="__module.model.model.decoder.layers.5.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1946" name="Constant_54595" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="121738720" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1947" name="__module.model.model.decoder.layers.5.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1948" name="Constant_54596" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="121742816" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1949" name="__module.model.model.decoder.layers.5.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1007"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1950" name="self.model.model.decoder.layers.5.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="121746912" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1951" name="Convert_756654" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1952" name="self.model.model.decoder.layers.5.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="123844064" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1953" name="Convert_756657" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1954" name="self.model.model.decoder.layers.5.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1955" name="self.model.model.decoder.layers.5.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="123860448" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1956" name="self.model.model.decoder.layers.5.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1957" name="Constant_756662" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1958" name="Reshape_756663" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1959" name="self.model.model.decoder.layers.5.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1960" name="__module.model.model.decoder.layers.5.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1961" name="Constant_54597" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="123925984" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1962" name="__module.model.model.decoder.layers.5.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="1010"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1963" name="__module.model.model.decoder.layers.5.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="1011,input.47"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1964" name="self.model.model.decoder.layers.5.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="123942368" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1965" name="Convert_760953" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1966" name="self.model.model.decoder.layers.5.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="126039520" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1967" name="Convert_760956" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1968" name="self.model.model.decoder.layers.5.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1969" name="self.model.model.decoder.layers.5.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="126055904" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="1970" name="self.model.model.decoder.layers.5.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="1971" name="Constant_760961" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1972" name="Reshape_760962" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1973" name="self.model.model.decoder.layers.5.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="1974" name="__module.model.model.decoder.layers.5.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1975" name="Constant_54598" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="126121440" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1976" name="__module.model.model.decoder.layers.5.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1015,input.49"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1977" name="__module.model.model.decoder.layers.5/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1017,1019,residual.37"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1978" name="__module.model.model.decoder.layers.6.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="1979" name="__module.model.model.decoder.layers.6.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1980" name="Constant_54599" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="126125536" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1981" name="__module.model.model.decoder.layers.6.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1982" name="Constant_54600" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="126129632" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1983" name="__module.model.model.decoder.layers.6.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1032,hidden_states.61"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1984" name="self.model.model.decoder.layers.6.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="126133728" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1985" name="Convert_1289730" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1986" name="self.model.model.decoder.layers.6.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="126658016" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1987" name="Convert_1289733" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1988" name="self.model.model.decoder.layers.6.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1989" name="self.model.model.decoder.layers.6.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="126662112" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="1990" name="self.model.model.decoder.layers.6.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="1991" name="Constant_1289738" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="1992" name="Reshape_1289739" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1993" name="self.model.model.decoder.layers.6.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1994" name="__module.model.model.decoder.layers.6.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1995" name="Constant_54601" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="126678496" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1996" name="__module.model.model.decoder.layers.6.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1041,tensor.73"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="1997" name="Constant_58005" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1998" name="__module.model.model.decoder.layers.6.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1043"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="1999" name="__module.model.model.decoder.layers.6.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2000" name="__module.model.model.decoder.layers.6.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1044"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2001" name="Constant_60601" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2002" name="Constant_60594" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2003" name="Constant_60596" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2004" name="Constant_60598" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2005" name="Concat_60599" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2006" name="Broadcast_60602" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2007" name="ReadValue_60021" type="ReadValue" version="opset6"> <data variable_id="past_key_values.6.decoder.keypresent.6.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.6.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2008" name="Constant_59452" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2009" name="Gather_59453" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2010" name="self.model.model.decoder.layers.6.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="126682592" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2011" name="Convert_1285431" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2012" name="self.model.model.decoder.layers.6.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="127206880" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2013" name="Convert_1285434" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2014" name="self.model.model.decoder.layers.6.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2015" name="self.model.model.decoder.layers.6.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="127210976" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2016" name="self.model.model.decoder.layers.6.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2017" name="Constant_1285439" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2018" name="Reshape_1285440" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2019" name="self.model.model.decoder.layers.6.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2020" name="__module.model.model.decoder.layers.6.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1047,tensor.75"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2021" name="Constant_58006" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2022" name="__module.model.model.decoder.layers.6.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1049"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2023" name="__module.model.model.decoder.layers.6.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2024" name="__module.model.model.decoder.layers.6.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1050"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2025" name="__module.model.model.decoder.layers.6.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.21"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2026" name="Constant_60589" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2027" name="Constant_60582" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2028" name="Constant_60584" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2029" name="Constant_60586" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2030" name="Concat_60587" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2031" name="Broadcast_60590" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2032" name="ReadValue_60023" type="ReadValue" version="opset6"> <data variable_id="past_key_values.6.decoder.valuepresent.6.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.6.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2033" name="Constant_59455" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2034" name="Gather_59456" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2035" name="self.model.model.decoder.layers.6.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="127227360" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2036" name="Convert_1281132" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2037" name="self.model.model.decoder.layers.6.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="127751648" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2038" name="Convert_1281135" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2039" name="self.model.model.decoder.layers.6.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2040" name="self.model.model.decoder.layers.6.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="127755744" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2041" name="self.model.model.decoder.layers.6.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2042" name="Constant_1281140" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2043" name="Reshape_1281141" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2044" name="self.model.model.decoder.layers.6.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2045" name="__module.model.model.decoder.layers.6.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2046" name="Constant_54602" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="127772128" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2047" name="__module.model.model.decoder.layers.6.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1054,tensor.77"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2048" name="Constant_58007" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2049" name="__module.model.model.decoder.layers.6.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1056"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2050" name="__module.model.model.decoder.layers.6.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2051" name="__module.model.model.decoder.layers.6.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1057"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2052" name="__module.model.model.decoder.layers.6.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2053" name="__module.model.model.decoder.layers.6.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1068,attn_output.49"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2054" name="__module.model.model.decoder.layers.6.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2055" name="__module.model.model.decoder.layers.6.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1069,attn_output.51"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2056" name="Constant_58008" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2057" name="__module.model.model.decoder.layers.6.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1071"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2058" name="self.model.model.decoder.layers.6.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="127776224" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2059" name="Convert_1294029" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2060" name="self.model.model.decoder.layers.6.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="128300512" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2061" name="Convert_1294032" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2062" name="self.model.model.decoder.layers.6.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2063" name="self.model.model.decoder.layers.6.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="128304608" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2064" name="self.model.model.decoder.layers.6.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2065" name="Constant_1294037" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2066" name="Reshape_1294038" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2067" name="self.model.model.decoder.layers.6.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2068" name="__module.model.model.decoder.layers.6.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2069" name="Constant_54603" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="128320992" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2070" name="__module.model.model.decoder.layers.6.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1074,1076,input.51"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2071" name="__module.model.model.decoder.layers.6/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1080,residual.39"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2072" name="__module.model.model.decoder.layers.6.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2073" name="__module.model.model.decoder.layers.6.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2074" name="Constant_54604" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="128325088" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2075" name="__module.model.model.decoder.layers.6.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2076" name="Constant_54605" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="128329184" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2077" name="__module.model.model.decoder.layers.6.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1084,hidden_states.65"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2078" name="self.model.model.decoder.layers.6.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="128333280" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2079" name="Convert_1298328" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2080" name="self.model.model.decoder.layers.6.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="128857568" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2081" name="Convert_1298331" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2082" name="self.model.model.decoder.layers.6.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2083" name="self.model.model.decoder.layers.6.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="128861664" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2084" name="self.model.model.decoder.layers.6.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2085" name="Constant_1298336" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2086" name="Reshape_1298337" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2087" name="self.model.model.decoder.layers.6.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2088" name="__module.model.model.decoder.layers.6.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2089" name="Constant_54606" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="128878048" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2090" name="__module.model.model.decoder.layers.6.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1093,tensor.79"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2091" name="Constant_58009" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2092" name="__module.model.model.decoder.layers.6.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1095"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2093" name="__module.model.model.decoder.layers.6.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2094" name="__module.model.model.decoder.layers.6.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1096"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2095" name="__module.model.model.decoder.layers.6.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="1111,attn_output.53"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2096" name="__module.model.model.decoder.layers.6.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2097" name="__module.model.model.decoder.layers.6.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1112,attn_output.55"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2098" name="Constant_58012" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2099" name="__module.model.model.decoder.layers.6.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1114"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2100" name="self.model.model.decoder.layers.6.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="128882144" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2101" name="Convert_1302627" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2102" name="self.model.model.decoder.layers.6.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="129406432" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2103" name="Convert_1302630" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2104" name="self.model.model.decoder.layers.6.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2105" name="self.model.model.decoder.layers.6.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="129410528" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2106" name="self.model.model.decoder.layers.6.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2107" name="Constant_1302635" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2108" name="Reshape_1302636" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2109" name="self.model.model.decoder.layers.6.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2110" name="__module.model.model.decoder.layers.6.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2111" name="Constant_54608" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="129426912" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2112" name="__module.model.model.decoder.layers.6.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1117,input.53"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2113" name="__module.model.model.decoder.layers.6/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1119,residual.41"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2114" name="__module.model.model.decoder.layers.6.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2115" name="__module.model.model.decoder.layers.6.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2116" name="Constant_54609" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="129431008" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2117" name="__module.model.model.decoder.layers.6.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2118" name="Constant_54610" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="129435104" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2119" name="__module.model.model.decoder.layers.6.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1123"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2120" name="self.model.model.decoder.layers.6.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="129439200" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2121" name="Convert_765252" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2122" name="self.model.model.decoder.layers.6.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="131536352" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2123" name="Convert_765255" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2124" name="self.model.model.decoder.layers.6.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2125" name="self.model.model.decoder.layers.6.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="131552736" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2126" name="self.model.model.decoder.layers.6.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2127" name="Constant_765260" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2128" name="Reshape_765261" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2129" name="self.model.model.decoder.layers.6.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2130" name="__module.model.model.decoder.layers.6.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2131" name="Constant_54611" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="131618272" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2132" name="__module.model.model.decoder.layers.6.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="1126"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2133" name="__module.model.model.decoder.layers.6.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="1127,input.55"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2134" name="self.model.model.decoder.layers.6.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="131634656" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2135" name="Convert_769551" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2136" name="self.model.model.decoder.layers.6.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="133731808" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2137" name="Convert_769554" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2138" name="self.model.model.decoder.layers.6.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2139" name="self.model.model.decoder.layers.6.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="133748192" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2140" name="self.model.model.decoder.layers.6.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2141" name="Constant_769559" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2142" name="Reshape_769560" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2143" name="self.model.model.decoder.layers.6.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2144" name="__module.model.model.decoder.layers.6.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2145" name="Constant_54612" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="133813728" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2146" name="__module.model.model.decoder.layers.6.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1131,input.57"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2147" name="__module.model.model.decoder.layers.6/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1133,1135,residual.43"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2148" name="__module.model.model.decoder.layers.7.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2149" name="__module.model.model.decoder.layers.7.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2150" name="Constant_54613" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="133817824" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2151" name="__module.model.model.decoder.layers.7.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2152" name="Constant_54614" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="133821920" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2153" name="__module.model.model.decoder.layers.7.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1148,hidden_states.71"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2154" name="self.model.model.decoder.layers.7.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="133826016" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2155" name="Convert_1315524" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2156" name="self.model.model.decoder.layers.7.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="134350304" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2157" name="Convert_1315527" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2158" name="self.model.model.decoder.layers.7.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2159" name="self.model.model.decoder.layers.7.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="134354400" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2160" name="self.model.model.decoder.layers.7.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2161" name="Constant_1315532" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2162" name="Reshape_1315533" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2163" name="self.model.model.decoder.layers.7.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2164" name="__module.model.model.decoder.layers.7.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2165" name="Constant_54615" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="134370784" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2166" name="__module.model.model.decoder.layers.7.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1157,tensor.85"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2167" name="Constant_58013" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2168" name="__module.model.model.decoder.layers.7.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1159"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2169" name="__module.model.model.decoder.layers.7.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2170" name="__module.model.model.decoder.layers.7.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1160"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2171" name="Constant_60625" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2172" name="Constant_60618" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2173" name="Constant_60620" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2174" name="Constant_60622" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2175" name="Concat_60623" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2176" name="Broadcast_60626" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2177" name="ReadValue_60025" type="ReadValue" version="opset6"> <data variable_id="past_key_values.7.decoder.keypresent.7.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.7.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2178" name="Constant_59458" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2179" name="Gather_59459" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2180" name="self.model.model.decoder.layers.7.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="134374880" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2181" name="Convert_1311225" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2182" name="self.model.model.decoder.layers.7.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="134899168" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2183" name="Convert_1311228" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2184" name="self.model.model.decoder.layers.7.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2185" name="self.model.model.decoder.layers.7.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="134903264" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2186" name="self.model.model.decoder.layers.7.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2187" name="Constant_1311233" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2188" name="Reshape_1311234" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2189" name="self.model.model.decoder.layers.7.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2190" name="__module.model.model.decoder.layers.7.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1163,tensor.87"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2191" name="Constant_58014" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2192" name="__module.model.model.decoder.layers.7.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1165"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2193" name="__module.model.model.decoder.layers.7.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2194" name="__module.model.model.decoder.layers.7.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1166"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2195" name="__module.model.model.decoder.layers.7.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.23"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2196" name="Constant_60613" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2197" name="Constant_60606" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2198" name="Constant_60608" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2199" name="Constant_60610" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2200" name="Concat_60611" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2201" name="Broadcast_60614" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2202" name="ReadValue_60027" type="ReadValue" version="opset6"> <data variable_id="past_key_values.7.decoder.valuepresent.7.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.7.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2203" name="Constant_59461" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2204" name="Gather_59462" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2205" name="self.model.model.decoder.layers.7.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="134919648" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2206" name="Convert_1306926" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2207" name="self.model.model.decoder.layers.7.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="135443936" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2208" name="Convert_1306929" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2209" name="self.model.model.decoder.layers.7.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2210" name="self.model.model.decoder.layers.7.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="135448032" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2211" name="self.model.model.decoder.layers.7.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2212" name="Constant_1306934" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2213" name="Reshape_1306935" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2214" name="self.model.model.decoder.layers.7.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2215" name="__module.model.model.decoder.layers.7.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2216" name="Constant_54616" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="135464416" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2217" name="__module.model.model.decoder.layers.7.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1170,tensor.89"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2218" name="Constant_58015" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2219" name="__module.model.model.decoder.layers.7.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1172"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2220" name="__module.model.model.decoder.layers.7.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2221" name="__module.model.model.decoder.layers.7.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1173"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2222" name="__module.model.model.decoder.layers.7.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2223" name="__module.model.model.decoder.layers.7.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1184,attn_output.57"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2224" name="__module.model.model.decoder.layers.7.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2225" name="__module.model.model.decoder.layers.7.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1185,attn_output.59"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2226" name="Constant_58016" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2227" name="__module.model.model.decoder.layers.7.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1187"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2228" name="self.model.model.decoder.layers.7.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="135468512" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2229" name="Convert_1319823" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2230" name="self.model.model.decoder.layers.7.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="135992800" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2231" name="Convert_1319826" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2232" name="self.model.model.decoder.layers.7.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2233" name="self.model.model.decoder.layers.7.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="135996896" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2234" name="self.model.model.decoder.layers.7.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2235" name="Constant_1319831" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2236" name="Reshape_1319832" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2237" name="self.model.model.decoder.layers.7.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2238" name="__module.model.model.decoder.layers.7.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2239" name="Constant_54617" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="136013280" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2240" name="__module.model.model.decoder.layers.7.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1190,1192,input.59"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2241" name="__module.model.model.decoder.layers.7/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1196,residual.45"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2242" name="__module.model.model.decoder.layers.7.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2243" name="__module.model.model.decoder.layers.7.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2244" name="Constant_54618" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="136017376" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2245" name="__module.model.model.decoder.layers.7.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2246" name="Constant_54619" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="136021472" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2247" name="__module.model.model.decoder.layers.7.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1200,hidden_states.75"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2248" name="self.model.model.decoder.layers.7.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="136025568" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2249" name="Convert_1324122" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2250" name="self.model.model.decoder.layers.7.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="136549856" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2251" name="Convert_1324125" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2252" name="self.model.model.decoder.layers.7.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2253" name="self.model.model.decoder.layers.7.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="136553952" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2254" name="self.model.model.decoder.layers.7.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2255" name="Constant_1324130" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2256" name="Reshape_1324131" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2257" name="self.model.model.decoder.layers.7.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2258" name="__module.model.model.decoder.layers.7.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2259" name="Constant_54620" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="136570336" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2260" name="__module.model.model.decoder.layers.7.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1209,tensor.91"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2261" name="Constant_58017" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2262" name="__module.model.model.decoder.layers.7.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1211"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2263" name="__module.model.model.decoder.layers.7.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2264" name="__module.model.model.decoder.layers.7.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1212"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2265" name="__module.model.model.decoder.layers.7.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="1227,attn_output.61"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2266" name="__module.model.model.decoder.layers.7.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2267" name="__module.model.model.decoder.layers.7.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1228,attn_output.63"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2268" name="Constant_58020" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2269" name="__module.model.model.decoder.layers.7.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1230"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2270" name="self.model.model.decoder.layers.7.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="136574432" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2271" name="Convert_1328421" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2272" name="self.model.model.decoder.layers.7.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="137098720" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2273" name="Convert_1328424" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2274" name="self.model.model.decoder.layers.7.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2275" name="self.model.model.decoder.layers.7.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="137102816" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2276" name="self.model.model.decoder.layers.7.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2277" name="Constant_1328429" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2278" name="Reshape_1328430" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2279" name="self.model.model.decoder.layers.7.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2280" name="__module.model.model.decoder.layers.7.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2281" name="Constant_54622" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="137119200" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2282" name="__module.model.model.decoder.layers.7.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1233,input.61"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2283" name="__module.model.model.decoder.layers.7/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1235,residual.47"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2284" name="__module.model.model.decoder.layers.7.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2285" name="__module.model.model.decoder.layers.7.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2286" name="Constant_54623" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="137123296" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2287" name="__module.model.model.decoder.layers.7.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2288" name="Constant_54624" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="137127392" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2289" name="__module.model.model.decoder.layers.7.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1239"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2290" name="self.model.model.decoder.layers.7.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="137131488" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2291" name="Convert_773850" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2292" name="self.model.model.decoder.layers.7.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="139228640" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2293" name="Convert_773853" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2294" name="self.model.model.decoder.layers.7.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2295" name="self.model.model.decoder.layers.7.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="139245024" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2296" name="self.model.model.decoder.layers.7.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2297" name="Constant_773858" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2298" name="Reshape_773859" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2299" name="self.model.model.decoder.layers.7.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2300" name="__module.model.model.decoder.layers.7.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2301" name="Constant_54625" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="139310560" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2302" name="__module.model.model.decoder.layers.7.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="1242"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2303" name="__module.model.model.decoder.layers.7.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="1243,input.63"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2304" name="self.model.model.decoder.layers.7.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="139326944" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2305" name="Convert_778149" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2306" name="self.model.model.decoder.layers.7.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="141424096" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2307" name="Convert_778152" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2308" name="self.model.model.decoder.layers.7.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2309" name="self.model.model.decoder.layers.7.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="141440480" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2310" name="self.model.model.decoder.layers.7.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2311" name="Constant_778157" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2312" name="Reshape_778158" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2313" name="self.model.model.decoder.layers.7.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2314" name="__module.model.model.decoder.layers.7.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2315" name="Constant_54626" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="141506016" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2316" name="__module.model.model.decoder.layers.7.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1247,input.65"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2317" name="__module.model.model.decoder.layers.7/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1249,1251,residual.49"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2318" name="__module.model.model.decoder.layers.8.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2319" name="__module.model.model.decoder.layers.8.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2320" name="Constant_54627" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="141510112" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2321" name="__module.model.model.decoder.layers.8.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2322" name="Constant_54628" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="141514208" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2323" name="__module.model.model.decoder.layers.8.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1264,hidden_states.81"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2324" name="self.model.model.decoder.layers.8.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="141518304" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2325" name="Convert_1341318" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2326" name="self.model.model.decoder.layers.8.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="142042592" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2327" name="Convert_1341321" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2328" name="self.model.model.decoder.layers.8.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2329" name="self.model.model.decoder.layers.8.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="142046688" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2330" name="self.model.model.decoder.layers.8.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2331" name="Constant_1341326" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2332" name="Reshape_1341327" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2333" name="self.model.model.decoder.layers.8.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2334" name="__module.model.model.decoder.layers.8.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2335" name="Constant_54629" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="142063072" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2336" name="__module.model.model.decoder.layers.8.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1273,tensor.97"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2337" name="Constant_58021" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2338" name="__module.model.model.decoder.layers.8.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1275"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2339" name="__module.model.model.decoder.layers.8.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2340" name="__module.model.model.decoder.layers.8.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1276"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2341" name="Constant_60649" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2342" name="Constant_60642" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2343" name="Constant_60644" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2344" name="Constant_60646" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2345" name="Concat_60647" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2346" name="Broadcast_60650" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2347" name="ReadValue_60029" type="ReadValue" version="opset6"> <data variable_id="past_key_values.8.decoder.keypresent.8.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.8.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2348" name="Constant_59464" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2349" name="Gather_59465" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2350" name="self.model.model.decoder.layers.8.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="142067168" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2351" name="Convert_1337019" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2352" name="self.model.model.decoder.layers.8.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="142591456" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2353" name="Convert_1337022" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2354" name="self.model.model.decoder.layers.8.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2355" name="self.model.model.decoder.layers.8.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="142595552" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2356" name="self.model.model.decoder.layers.8.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2357" name="Constant_1337027" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2358" name="Reshape_1337028" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2359" name="self.model.model.decoder.layers.8.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2360" name="__module.model.model.decoder.layers.8.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1279,tensor.99"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2361" name="Constant_58022" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2362" name="__module.model.model.decoder.layers.8.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1281"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2363" name="__module.model.model.decoder.layers.8.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2364" name="__module.model.model.decoder.layers.8.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1282"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2365" name="__module.model.model.decoder.layers.8.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.25"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2366" name="Constant_60637" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2367" name="Constant_60630" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2368" name="Constant_60632" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2369" name="Constant_60634" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2370" name="Concat_60635" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2371" name="Broadcast_60638" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2372" name="ReadValue_60031" type="ReadValue" version="opset6"> <data variable_id="past_key_values.8.decoder.valuepresent.8.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.8.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2373" name="Constant_59467" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2374" name="Gather_59468" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2375" name="self.model.model.decoder.layers.8.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="142611936" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2376" name="Convert_1332720" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2377" name="self.model.model.decoder.layers.8.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="143136224" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2378" name="Convert_1332723" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2379" name="self.model.model.decoder.layers.8.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2380" name="self.model.model.decoder.layers.8.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="143140320" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2381" name="self.model.model.decoder.layers.8.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2382" name="Constant_1332728" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2383" name="Reshape_1332729" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2384" name="self.model.model.decoder.layers.8.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2385" name="__module.model.model.decoder.layers.8.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2386" name="Constant_54630" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="143156704" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2387" name="__module.model.model.decoder.layers.8.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1286,tensor.101"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2388" name="Constant_58023" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2389" name="__module.model.model.decoder.layers.8.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1288"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2390" name="__module.model.model.decoder.layers.8.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2391" name="__module.model.model.decoder.layers.8.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1289"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2392" name="__module.model.model.decoder.layers.8.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2393" name="__module.model.model.decoder.layers.8.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1300,attn_output.65"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2394" name="__module.model.model.decoder.layers.8.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2395" name="__module.model.model.decoder.layers.8.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1301,attn_output.67"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2396" name="Constant_58024" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2397" name="__module.model.model.decoder.layers.8.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1303"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2398" name="self.model.model.decoder.layers.8.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="143160800" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2399" name="Convert_1345617" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2400" name="self.model.model.decoder.layers.8.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="143685088" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2401" name="Convert_1345620" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2402" name="self.model.model.decoder.layers.8.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2403" name="self.model.model.decoder.layers.8.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="143689184" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2404" name="self.model.model.decoder.layers.8.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2405" name="Constant_1345625" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2406" name="Reshape_1345626" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2407" name="self.model.model.decoder.layers.8.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2408" name="__module.model.model.decoder.layers.8.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2409" name="Constant_54631" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="143705568" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2410" name="__module.model.model.decoder.layers.8.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1306,1308,input.67"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2411" name="__module.model.model.decoder.layers.8/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1312,residual.51"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2412" name="__module.model.model.decoder.layers.8.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2413" name="__module.model.model.decoder.layers.8.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2414" name="Constant_54632" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="143709664" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2415" name="__module.model.model.decoder.layers.8.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2416" name="Constant_54633" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="143713760" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2417" name="__module.model.model.decoder.layers.8.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1316,hidden_states.85"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2418" name="self.model.model.decoder.layers.8.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="143717856" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2419" name="Convert_1349916" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2420" name="self.model.model.decoder.layers.8.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="144242144" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2421" name="Convert_1349919" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2422" name="self.model.model.decoder.layers.8.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2423" name="self.model.model.decoder.layers.8.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="144246240" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2424" name="self.model.model.decoder.layers.8.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2425" name="Constant_1349924" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2426" name="Reshape_1349925" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2427" name="self.model.model.decoder.layers.8.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2428" name="__module.model.model.decoder.layers.8.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2429" name="Constant_54634" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="144262624" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2430" name="__module.model.model.decoder.layers.8.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1325,tensor.103"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2431" name="Constant_58025" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2432" name="__module.model.model.decoder.layers.8.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1327"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2433" name="__module.model.model.decoder.layers.8.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2434" name="__module.model.model.decoder.layers.8.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1328"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2435" name="__module.model.model.decoder.layers.8.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="1343,attn_output.69"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2436" name="__module.model.model.decoder.layers.8.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2437" name="__module.model.model.decoder.layers.8.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1344,attn_output.71"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2438" name="Constant_58028" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2439" name="__module.model.model.decoder.layers.8.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1346"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2440" name="self.model.model.decoder.layers.8.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="144266720" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2441" name="Convert_1354215" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2442" name="self.model.model.decoder.layers.8.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="144791008" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2443" name="Convert_1354218" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2444" name="self.model.model.decoder.layers.8.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2445" name="self.model.model.decoder.layers.8.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="144795104" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2446" name="self.model.model.decoder.layers.8.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2447" name="Constant_1354223" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2448" name="Reshape_1354224" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2449" name="self.model.model.decoder.layers.8.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2450" name="__module.model.model.decoder.layers.8.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2451" name="Constant_54636" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="144811488" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2452" name="__module.model.model.decoder.layers.8.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1349,input.69"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2453" name="__module.model.model.decoder.layers.8/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1351,residual.53"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2454" name="__module.model.model.decoder.layers.8.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2455" name="__module.model.model.decoder.layers.8.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2456" name="Constant_54637" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="144815584" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2457" name="__module.model.model.decoder.layers.8.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2458" name="Constant_54638" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="144819680" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2459" name="__module.model.model.decoder.layers.8.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1355"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2460" name="self.model.model.decoder.layers.8.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="144823776" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2461" name="Convert_782448" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2462" name="self.model.model.decoder.layers.8.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="146920928" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2463" name="Convert_782451" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2464" name="self.model.model.decoder.layers.8.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2465" name="self.model.model.decoder.layers.8.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="146937312" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2466" name="self.model.model.decoder.layers.8.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2467" name="Constant_782456" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2468" name="Reshape_782457" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2469" name="self.model.model.decoder.layers.8.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2470" name="__module.model.model.decoder.layers.8.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2471" name="Constant_54639" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="147002848" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2472" name="__module.model.model.decoder.layers.8.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="1358"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2473" name="__module.model.model.decoder.layers.8.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="1359,input.71"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2474" name="self.model.model.decoder.layers.8.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="147019232" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2475" name="Convert_786747" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2476" name="self.model.model.decoder.layers.8.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="149116384" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2477" name="Convert_786750" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2478" name="self.model.model.decoder.layers.8.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2479" name="self.model.model.decoder.layers.8.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="149132768" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2480" name="self.model.model.decoder.layers.8.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2481" name="Constant_786755" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2482" name="Reshape_786756" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2483" name="self.model.model.decoder.layers.8.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2484" name="__module.model.model.decoder.layers.8.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2485" name="Constant_54640" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="149198304" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2486" name="__module.model.model.decoder.layers.8.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1363,input.73"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2487" name="__module.model.model.decoder.layers.8/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1365,1367,residual.55"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2488" name="__module.model.model.decoder.layers.9.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2489" name="__module.model.model.decoder.layers.9.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2490" name="Constant_54641" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="149202400" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2491" name="__module.model.model.decoder.layers.9.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2492" name="Constant_54642" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="149206496" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2493" name="__module.model.model.decoder.layers.9.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1380,hidden_states.91"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2494" name="self.model.model.decoder.layers.9.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="149210592" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2495" name="Convert_1358514" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2496" name="self.model.model.decoder.layers.9.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="149734880" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2497" name="Convert_1358517" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2498" name="self.model.model.decoder.layers.9.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2499" name="self.model.model.decoder.layers.9.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="149738976" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2500" name="self.model.model.decoder.layers.9.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2501" name="Constant_1358522" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2502" name="Reshape_1358523" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2503" name="self.model.model.decoder.layers.9.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2504" name="__module.model.model.decoder.layers.9.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2505" name="Constant_54644" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="149755360" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2506" name="__module.model.model.decoder.layers.9.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1402,tensor.113"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2507" name="Constant_58031" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2508" name="__module.model.model.decoder.layers.9.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1404"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2509" name="__module.model.model.decoder.layers.9.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2510" name="__module.model.model.decoder.layers.9.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1405"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2511" name="__module.model.model.decoder.layers.9.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2513" name="Constant_60661" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2514" name="Constant_60654" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2515" name="Constant_60656" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2516" name="Constant_60658" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2517" name="Concat_60659" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2518" name="Broadcast_60662" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2519" name="ReadValue_60033" type="ReadValue" version="opset6"> <data variable_id="past_key_values.9.decoder.keypresent.9.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.9.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2520" name="Constant_59470" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2521" name="Gather_59471" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2522" name="self.model.model.decoder.layers.9.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="149759456" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2523" name="Convert_1362813" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2524" name="self.model.model.decoder.layers.9.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="150283744" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2525" name="Convert_1362816" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2526" name="self.model.model.decoder.layers.9.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2527" name="self.model.model.decoder.layers.9.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="150287840" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2528" name="self.model.model.decoder.layers.9.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2529" name="Constant_1362821" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2530" name="Reshape_1362822" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2531" name="self.model.model.decoder.layers.9.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2532" name="__module.model.model.decoder.layers.9.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1395,tensor.111"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2533" name="Constant_58030" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2534" name="__module.model.model.decoder.layers.9.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1397"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2535" name="__module.model.model.decoder.layers.9.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2536" name="__module.model.model.decoder.layers.9.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1398"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2537" name="__module.model.model.decoder.layers.9.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.27"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2551" name="Constant_60673" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2552" name="Constant_60666" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2553" name="Constant_60668" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2554" name="Constant_60670" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2555" name="Concat_60671" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2556" name="Broadcast_60674" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2557" name="ReadValue_60007" type="ReadValue" version="opset6"> <data variable_id="past_key_values.23.decoder.valuepresent.23.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.23.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2558" name="Constant_59557" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2559" name="Gather_59558" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2560" name="self.model.model.decoder.layers.9.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="150304224" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2561" name="Convert_1367112" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2562" name="self.model.model.decoder.layers.9.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="150828512" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2563" name="Convert_1367115" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2564" name="self.model.model.decoder.layers.9.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2565" name="self.model.model.decoder.layers.9.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="150832608" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2566" name="self.model.model.decoder.layers.9.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2567" name="Constant_1367120" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2568" name="Reshape_1367121" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2569" name="self.model.model.decoder.layers.9.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2570" name="__module.model.model.decoder.layers.9.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2571" name="Constant_54643" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="150848992" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2572" name="__module.model.model.decoder.layers.9.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1389,tensor.109"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2573" name="Constant_58029" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2574" name="__module.model.model.decoder.layers.9.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1391"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2575" name="__module.model.model.decoder.layers.9.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2576" name="__module.model.model.decoder.layers.9.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1392"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2577" name="__module.model.model.decoder.layers.9.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1416,attn_output.73"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2578" name="__module.model.model.decoder.layers.9.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2579" name="__module.model.model.decoder.layers.9.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1417,attn_output.75"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2580" name="Constant_58032" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2581" name="__module.model.model.decoder.layers.9.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1419"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2582" name="self.model.model.decoder.layers.9.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="150853088" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2583" name="Convert_1371411" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2584" name="self.model.model.decoder.layers.9.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="151377376" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2585" name="Convert_1371414" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2586" name="self.model.model.decoder.layers.9.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2587" name="self.model.model.decoder.layers.9.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="151381472" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2588" name="self.model.model.decoder.layers.9.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2589" name="Constant_1371419" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2590" name="Reshape_1371420" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2591" name="self.model.model.decoder.layers.9.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2592" name="__module.model.model.decoder.layers.9.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2593" name="Constant_54645" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="151397856" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2594" name="__module.model.model.decoder.layers.9.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1422,1424,input.75"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2595" name="__module.model.model.decoder.layers.9/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1428,residual.57"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2596" name="__module.model.model.decoder.layers.9.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2597" name="__module.model.model.decoder.layers.9.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2598" name="Constant_54646" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="151401952" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2599" name="__module.model.model.decoder.layers.9.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2600" name="Constant_54647" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="151406048" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2601" name="__module.model.model.decoder.layers.9.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1432,hidden_states.95"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2602" name="self.model.model.decoder.layers.9.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="151410144" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2603" name="Convert_1375710" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2604" name="self.model.model.decoder.layers.9.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="151934432" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2605" name="Convert_1375713" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2606" name="self.model.model.decoder.layers.9.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2607" name="self.model.model.decoder.layers.9.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="151938528" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2608" name="self.model.model.decoder.layers.9.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2609" name="Constant_1375718" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2610" name="Reshape_1375719" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2611" name="self.model.model.decoder.layers.9.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2612" name="__module.model.model.decoder.layers.9.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2613" name="Constant_54648" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="151954912" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2614" name="__module.model.model.decoder.layers.9.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1441,tensor.115"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2615" name="Constant_58033" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2616" name="__module.model.model.decoder.layers.9.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1443"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2617" name="__module.model.model.decoder.layers.9.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2618" name="__module.model.model.decoder.layers.9.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1444"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2619" name="__module.model.model.decoder.layers.9.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="1459,attn_output.77"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2620" name="__module.model.model.decoder.layers.9.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2621" name="__module.model.model.decoder.layers.9.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1460,attn_output.79"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2622" name="Constant_58036" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2623" name="__module.model.model.decoder.layers.9.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1462"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2624" name="self.model.model.decoder.layers.9.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="151959008" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2625" name="Convert_1380009" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2626" name="self.model.model.decoder.layers.9.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="152483296" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2627" name="Convert_1380012" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2628" name="self.model.model.decoder.layers.9.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2629" name="self.model.model.decoder.layers.9.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="152487392" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2630" name="self.model.model.decoder.layers.9.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2631" name="Constant_1380017" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2632" name="Reshape_1380018" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2633" name="self.model.model.decoder.layers.9.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2634" name="__module.model.model.decoder.layers.9.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2635" name="Constant_54650" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="152503776" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2636" name="__module.model.model.decoder.layers.9.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1465,input.77"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2637" name="__module.model.model.decoder.layers.9/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1467,residual.59"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2638" name="__module.model.model.decoder.layers.9.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2639" name="__module.model.model.decoder.layers.9.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2640" name="Constant_54651" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="152507872" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2641" name="__module.model.model.decoder.layers.9.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2642" name="Constant_54652" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="152511968" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2643" name="__module.model.model.decoder.layers.9.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1471"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2644" name="self.model.model.decoder.layers.9.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="152516064" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2645" name="Convert_791046" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2646" name="self.model.model.decoder.layers.9.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="154613216" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2647" name="Convert_791049" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2648" name="self.model.model.decoder.layers.9.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2649" name="self.model.model.decoder.layers.9.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="154629600" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2650" name="self.model.model.decoder.layers.9.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2651" name="Constant_791054" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2652" name="Reshape_791055" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2653" name="self.model.model.decoder.layers.9.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2654" name="__module.model.model.decoder.layers.9.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2655" name="Constant_54653" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="154695136" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2656" name="__module.model.model.decoder.layers.9.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="1474"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2657" name="__module.model.model.decoder.layers.9.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="1475,input.79"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2658" name="self.model.model.decoder.layers.9.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="154711520" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2659" name="Convert_795345" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2660" name="self.model.model.decoder.layers.9.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="156808672" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2661" name="Convert_795348" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2662" name="self.model.model.decoder.layers.9.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2663" name="self.model.model.decoder.layers.9.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="156825056" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2664" name="self.model.model.decoder.layers.9.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2665" name="Constant_795353" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2666" name="Reshape_795354" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2667" name="self.model.model.decoder.layers.9.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2668" name="__module.model.model.decoder.layers.9.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2669" name="Constant_54654" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="156890592" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2670" name="__module.model.model.decoder.layers.9.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1479,input.81"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2671" name="__module.model.model.decoder.layers.9/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1481,1483,residual.61"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2672" name="__module.model.model.decoder.layers.10.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2673" name="__module.model.model.decoder.layers.10.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2674" name="Constant_54655" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="156894688" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2675" name="__module.model.model.decoder.layers.10.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2676" name="Constant_54656" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="156898784" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2677" name="__module.model.model.decoder.layers.10.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1496,hidden_states.101"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2678" name="self.model.model.decoder.layers.10.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="156902880" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2679" name="Convert_1392906" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2680" name="self.model.model.decoder.layers.10.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="157427168" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2681" name="Convert_1392909" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2682" name="self.model.model.decoder.layers.10.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2683" name="self.model.model.decoder.layers.10.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="157431264" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2684" name="self.model.model.decoder.layers.10.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2685" name="Constant_1392914" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2686" name="Reshape_1392915" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2687" name="self.model.model.decoder.layers.10.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2688" name="__module.model.model.decoder.layers.10.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2689" name="Constant_54657" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="157447648" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2690" name="__module.model.model.decoder.layers.10.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1505,tensor.121"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2691" name="Constant_58037" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2692" name="__module.model.model.decoder.layers.10.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1507"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2693" name="__module.model.model.decoder.layers.10.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2694" name="__module.model.model.decoder.layers.10.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1508"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2695" name="Constant_60697" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2696" name="Constant_60690" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2697" name="Constant_60692" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2698" name="Constant_60694" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2699" name="Concat_60695" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2700" name="Broadcast_60698" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2701" name="ReadValue_59949" type="ReadValue" version="opset6"> <data variable_id="past_key_values.10.decoder.keypresent.10.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.10.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2702" name="Constant_59476" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2703" name="Gather_59477" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2704" name="self.model.model.decoder.layers.10.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="157451744" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2705" name="Convert_1388607" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2706" name="self.model.model.decoder.layers.10.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="157976032" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2707" name="Convert_1388610" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2708" name="self.model.model.decoder.layers.10.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2709" name="self.model.model.decoder.layers.10.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="157980128" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2710" name="self.model.model.decoder.layers.10.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2711" name="Constant_1388615" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2712" name="Reshape_1388616" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2713" name="self.model.model.decoder.layers.10.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2714" name="__module.model.model.decoder.layers.10.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1511,tensor.123"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2715" name="Constant_58038" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2716" name="__module.model.model.decoder.layers.10.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1513"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2717" name="__module.model.model.decoder.layers.10.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2718" name="__module.model.model.decoder.layers.10.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1514"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2719" name="__module.model.model.decoder.layers.10.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.29"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2720" name="Constant_60685" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2721" name="Constant_60678" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2722" name="Constant_60680" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2723" name="Constant_60682" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2724" name="Concat_60683" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2725" name="Broadcast_60686" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2726" name="ReadValue_59951" type="ReadValue" version="opset6"> <data variable_id="past_key_values.10.decoder.valuepresent.10.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.10.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2727" name="Constant_59479" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2728" name="Gather_59480" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2729" name="self.model.model.decoder.layers.10.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="157996512" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2730" name="Convert_1384308" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2731" name="self.model.model.decoder.layers.10.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="158520800" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2732" name="Convert_1384311" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2733" name="self.model.model.decoder.layers.10.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2734" name="self.model.model.decoder.layers.10.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="158524896" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2735" name="self.model.model.decoder.layers.10.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2736" name="Constant_1384316" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2737" name="Reshape_1384317" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2738" name="self.model.model.decoder.layers.10.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2739" name="__module.model.model.decoder.layers.10.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2740" name="Constant_54658" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="158541280" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2741" name="__module.model.model.decoder.layers.10.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1518,tensor.125"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2742" name="Constant_58039" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2743" name="__module.model.model.decoder.layers.10.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1520"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2744" name="__module.model.model.decoder.layers.10.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2745" name="__module.model.model.decoder.layers.10.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1521"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2746" name="__module.model.model.decoder.layers.10.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2747" name="__module.model.model.decoder.layers.10.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1532,attn_output.81"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2748" name="__module.model.model.decoder.layers.10.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2749" name="__module.model.model.decoder.layers.10.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1533,attn_output.83"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2750" name="Constant_58040" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2751" name="__module.model.model.decoder.layers.10.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1535"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2752" name="self.model.model.decoder.layers.10.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="158545376" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2753" name="Convert_1397205" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2754" name="self.model.model.decoder.layers.10.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="159069664" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2755" name="Convert_1397208" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2756" name="self.model.model.decoder.layers.10.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2757" name="self.model.model.decoder.layers.10.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="159073760" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2758" name="self.model.model.decoder.layers.10.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2759" name="Constant_1397213" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2760" name="Reshape_1397214" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2761" name="self.model.model.decoder.layers.10.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2762" name="__module.model.model.decoder.layers.10.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2763" name="Constant_54659" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="159090144" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2764" name="__module.model.model.decoder.layers.10.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1538,1540,input.83"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2765" name="__module.model.model.decoder.layers.10/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1544,residual.63"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2766" name="__module.model.model.decoder.layers.10.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2767" name="__module.model.model.decoder.layers.10.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2768" name="Constant_54660" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="159094240" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2769" name="__module.model.model.decoder.layers.10.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2770" name="Constant_54661" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="159098336" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2771" name="__module.model.model.decoder.layers.10.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1548,hidden_states.105"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2772" name="self.model.model.decoder.layers.10.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="159102432" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2773" name="Convert_1401504" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2774" name="self.model.model.decoder.layers.10.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="159626720" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2775" name="Convert_1401507" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2776" name="self.model.model.decoder.layers.10.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2777" name="self.model.model.decoder.layers.10.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="159630816" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2778" name="self.model.model.decoder.layers.10.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2779" name="Constant_1401512" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2780" name="Reshape_1401513" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2781" name="self.model.model.decoder.layers.10.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2782" name="__module.model.model.decoder.layers.10.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2783" name="Constant_54662" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="159647200" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2784" name="__module.model.model.decoder.layers.10.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1557,tensor.127"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2785" name="Constant_58041" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2786" name="__module.model.model.decoder.layers.10.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1559"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2787" name="__module.model.model.decoder.layers.10.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2788" name="__module.model.model.decoder.layers.10.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1560"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2789" name="__module.model.model.decoder.layers.10.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="1575,attn_output.85"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2790" name="__module.model.model.decoder.layers.10.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2791" name="__module.model.model.decoder.layers.10.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1576,attn_output.87"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2792" name="Constant_58044" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2793" name="__module.model.model.decoder.layers.10.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1578"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2794" name="self.model.model.decoder.layers.10.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="159651296" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2795" name="Convert_1405803" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2796" name="self.model.model.decoder.layers.10.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="160175584" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2797" name="Convert_1405806" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2798" name="self.model.model.decoder.layers.10.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2799" name="self.model.model.decoder.layers.10.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="160179680" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2800" name="self.model.model.decoder.layers.10.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2801" name="Constant_1405811" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2802" name="Reshape_1405812" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2803" name="self.model.model.decoder.layers.10.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2804" name="__module.model.model.decoder.layers.10.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2805" name="Constant_54664" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="160196064" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2806" name="__module.model.model.decoder.layers.10.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1581,input.85"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2807" name="__module.model.model.decoder.layers.10/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1583,residual.65"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2808" name="__module.model.model.decoder.layers.10.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2809" name="__module.model.model.decoder.layers.10.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2810" name="Constant_54665" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="160200160" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2811" name="__module.model.model.decoder.layers.10.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2812" name="Constant_54666" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="160204256" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2813" name="__module.model.model.decoder.layers.10.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1587"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2814" name="self.model.model.decoder.layers.10.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="160208352" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2815" name="Convert_799644" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2816" name="self.model.model.decoder.layers.10.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="162305504" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2817" name="Convert_799647" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2818" name="self.model.model.decoder.layers.10.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2819" name="self.model.model.decoder.layers.10.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="162321888" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2820" name="self.model.model.decoder.layers.10.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2821" name="Constant_799652" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2822" name="Reshape_799653" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2823" name="self.model.model.decoder.layers.10.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2824" name="__module.model.model.decoder.layers.10.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2825" name="Constant_54667" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="162387424" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2826" name="__module.model.model.decoder.layers.10.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="1590"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2827" name="__module.model.model.decoder.layers.10.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="1591,input.87"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2828" name="self.model.model.decoder.layers.10.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="162403808" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2829" name="Convert_803943" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2830" name="self.model.model.decoder.layers.10.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="164500960" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2831" name="Convert_803946" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2832" name="self.model.model.decoder.layers.10.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2833" name="self.model.model.decoder.layers.10.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="164517344" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="2834" name="self.model.model.decoder.layers.10.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2835" name="Constant_803951" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2836" name="Reshape_803952" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2837" name="self.model.model.decoder.layers.10.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2838" name="__module.model.model.decoder.layers.10.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2839" name="Constant_54668" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="164582880" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2840" name="__module.model.model.decoder.layers.10.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1595,input.89"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2841" name="__module.model.model.decoder.layers.10/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1597,1599,residual.67"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2842" name="__module.model.model.decoder.layers.11.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2843" name="__module.model.model.decoder.layers.11.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2844" name="Constant_54669" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="164586976" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2845" name="__module.model.model.decoder.layers.11.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2846" name="Constant_54670" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="164591072" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2847" name="__module.model.model.decoder.layers.11.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1612,hidden_states.111"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2848" name="self.model.model.decoder.layers.11.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="164595168" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2849" name="Convert_1418700" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2850" name="self.model.model.decoder.layers.11.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="165119456" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2851" name="Convert_1418703" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2852" name="self.model.model.decoder.layers.11.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2853" name="self.model.model.decoder.layers.11.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="165123552" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2854" name="self.model.model.decoder.layers.11.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2855" name="Constant_1418708" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2856" name="Reshape_1418709" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2857" name="self.model.model.decoder.layers.11.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2858" name="__module.model.model.decoder.layers.11.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2859" name="Constant_54671" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="165139936" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2860" name="__module.model.model.decoder.layers.11.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1621,tensor.133"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2861" name="Constant_58045" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2862" name="__module.model.model.decoder.layers.11.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1623"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2863" name="__module.model.model.decoder.layers.11.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2864" name="__module.model.model.decoder.layers.11.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1624"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2865" name="Constant_60721" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2866" name="Constant_60714" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2867" name="Constant_60716" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2868" name="Constant_60718" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2869" name="Concat_60719" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2870" name="Broadcast_60722" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2871" name="ReadValue_59953" type="ReadValue" version="opset6"> <data variable_id="past_key_values.11.decoder.keypresent.11.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.11.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2872" name="Constant_59482" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2873" name="Gather_59483" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2874" name="self.model.model.decoder.layers.11.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="165144032" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2875" name="Convert_1414401" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2876" name="self.model.model.decoder.layers.11.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="165668320" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2877" name="Convert_1414404" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2878" name="self.model.model.decoder.layers.11.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2879" name="self.model.model.decoder.layers.11.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="165672416" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2880" name="self.model.model.decoder.layers.11.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2881" name="Constant_1414409" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2882" name="Reshape_1414410" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2883" name="self.model.model.decoder.layers.11.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2884" name="__module.model.model.decoder.layers.11.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1627,tensor.135"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2885" name="Constant_58046" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2886" name="__module.model.model.decoder.layers.11.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1629"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2887" name="__module.model.model.decoder.layers.11.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2888" name="__module.model.model.decoder.layers.11.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1630"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2889" name="__module.model.model.decoder.layers.11.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.31"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2890" name="Constant_60709" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="2891" name="Constant_60702" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2892" name="Constant_60704" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2893" name="Constant_60706" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2894" name="Concat_60707" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2895" name="Broadcast_60710" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="2896" name="ReadValue_59955" type="ReadValue" version="opset6"> <data variable_id="past_key_values.11.decoder.valuepresent.11.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.11.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2897" name="Constant_59485" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2898" name="Gather_59486" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2899" name="self.model.model.decoder.layers.11.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="165688800" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2900" name="Convert_1410102" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2901" name="self.model.model.decoder.layers.11.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="166213088" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2902" name="Convert_1410105" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2903" name="self.model.model.decoder.layers.11.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2904" name="self.model.model.decoder.layers.11.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="166217184" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2905" name="self.model.model.decoder.layers.11.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2906" name="Constant_1410110" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2907" name="Reshape_1410111" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2908" name="self.model.model.decoder.layers.11.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2909" name="__module.model.model.decoder.layers.11.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2910" name="Constant_54672" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="166233568" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2911" name="__module.model.model.decoder.layers.11.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1634,tensor.137"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2912" name="Constant_58047" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2913" name="__module.model.model.decoder.layers.11.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1636"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2914" name="__module.model.model.decoder.layers.11.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2915" name="__module.model.model.decoder.layers.11.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1637"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2916" name="__module.model.model.decoder.layers.11.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2917" name="__module.model.model.decoder.layers.11.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1648,attn_output.89"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2918" name="__module.model.model.decoder.layers.11.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2919" name="__module.model.model.decoder.layers.11.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1649,attn_output.91"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2920" name="Constant_58048" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2921" name="__module.model.model.decoder.layers.11.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1651"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2922" name="self.model.model.decoder.layers.11.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="166237664" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2923" name="Convert_1422999" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2924" name="self.model.model.decoder.layers.11.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="166761952" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2925" name="Convert_1423002" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2926" name="self.model.model.decoder.layers.11.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2927" name="self.model.model.decoder.layers.11.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="166766048" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2928" name="self.model.model.decoder.layers.11.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2929" name="Constant_1423007" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2930" name="Reshape_1423008" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2931" name="self.model.model.decoder.layers.11.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2932" name="__module.model.model.decoder.layers.11.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2933" name="Constant_54673" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="166782432" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2934" name="__module.model.model.decoder.layers.11.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1654,1656,input.91"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2935" name="__module.model.model.decoder.layers.11/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1660,residual.69"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2936" name="__module.model.model.decoder.layers.11.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2937" name="__module.model.model.decoder.layers.11.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2938" name="Constant_54674" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="166786528" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2939" name="__module.model.model.decoder.layers.11.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2940" name="Constant_54675" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="166790624" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2941" name="__module.model.model.decoder.layers.11.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1664,hidden_states.115"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2942" name="self.model.model.decoder.layers.11.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="166794720" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2943" name="Convert_1427298" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2944" name="self.model.model.decoder.layers.11.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="167319008" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2945" name="Convert_1427301" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2946" name="self.model.model.decoder.layers.11.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2947" name="self.model.model.decoder.layers.11.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="167323104" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2948" name="self.model.model.decoder.layers.11.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2949" name="Constant_1427306" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2950" name="Reshape_1427307" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2951" name="self.model.model.decoder.layers.11.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2952" name="__module.model.model.decoder.layers.11.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2953" name="Constant_54676" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="167339488" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2954" name="__module.model.model.decoder.layers.11.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1673,tensor.139"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2955" name="Constant_58049" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2956" name="__module.model.model.decoder.layers.11.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1675"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2957" name="__module.model.model.decoder.layers.11.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2958" name="__module.model.model.decoder.layers.11.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1676"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2959" name="__module.model.model.decoder.layers.11.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="1691,attn_output.93"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2960" name="__module.model.model.decoder.layers.11.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2961" name="__module.model.model.decoder.layers.11.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1692,attn_output.95"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="2962" name="Constant_58052" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2963" name="__module.model.model.decoder.layers.11.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1694"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2964" name="self.model.model.decoder.layers.11.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="167343584" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2965" name="Convert_1431597" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2966" name="self.model.model.decoder.layers.11.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="167867872" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2967" name="Convert_1431600" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2968" name="self.model.model.decoder.layers.11.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2969" name="self.model.model.decoder.layers.11.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="167871968" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2970" name="self.model.model.decoder.layers.11.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2971" name="Constant_1431605" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2972" name="Reshape_1431606" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2973" name="self.model.model.decoder.layers.11.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2974" name="__module.model.model.decoder.layers.11.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2975" name="Constant_54678" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="167888352" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2976" name="__module.model.model.decoder.layers.11.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1697,input.93"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2977" name="__module.model.model.decoder.layers.11/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1699,residual.71"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2978" name="__module.model.model.decoder.layers.11.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="2979" name="__module.model.model.decoder.layers.11.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2980" name="Constant_54679" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="167892448" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2981" name="__module.model.model.decoder.layers.11.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2982" name="Constant_54680" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="167896544" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2983" name="__module.model.model.decoder.layers.11.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1703"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2984" name="self.model.model.decoder.layers.11.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="167900640" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2985" name="Convert_808242" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2986" name="self.model.model.decoder.layers.11.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="169997792" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2987" name="Convert_808245" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2988" name="self.model.model.decoder.layers.11.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2989" name="self.model.model.decoder.layers.11.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="170014176" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="2990" name="self.model.model.decoder.layers.11.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="2991" name="Constant_808250" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="2992" name="Reshape_808251" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2993" name="self.model.model.decoder.layers.11.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="2994" name="__module.model.model.decoder.layers.11.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2995" name="Constant_54681" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="170079712" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2996" name="__module.model.model.decoder.layers.11.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="1706"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2997" name="__module.model.model.decoder.layers.11.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="1707,input.95"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="2998" name="self.model.model.decoder.layers.11.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="170096096" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="2999" name="Convert_812541" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3000" name="self.model.model.decoder.layers.11.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="172193248" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3001" name="Convert_812544" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3002" name="self.model.model.decoder.layers.11.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3003" name="self.model.model.decoder.layers.11.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="172209632" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3004" name="self.model.model.decoder.layers.11.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3005" name="Constant_812549" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3006" name="Reshape_812550" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3007" name="self.model.model.decoder.layers.11.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3008" name="__module.model.model.decoder.layers.11.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3009" name="Constant_54682" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="172275168" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3010" name="__module.model.model.decoder.layers.11.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1711,input.97"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3011" name="__module.model.model.decoder.layers.11/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1713,1715,residual.73"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3012" name="__module.model.model.decoder.layers.12.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3013" name="__module.model.model.decoder.layers.12.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3014" name="Constant_54683" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="172279264" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3015" name="__module.model.model.decoder.layers.12.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3016" name="Constant_54684" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="172283360" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3017" name="__module.model.model.decoder.layers.12.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1728,hidden_states.121"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3018" name="self.model.model.decoder.layers.12.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="172287456" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3019" name="Convert_1444494" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3020" name="self.model.model.decoder.layers.12.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="172811744" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3021" name="Convert_1444497" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3022" name="self.model.model.decoder.layers.12.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3023" name="self.model.model.decoder.layers.12.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="172815840" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3024" name="self.model.model.decoder.layers.12.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3025" name="Constant_1444502" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3026" name="Reshape_1444503" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3027" name="self.model.model.decoder.layers.12.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3028" name="__module.model.model.decoder.layers.12.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3029" name="Constant_54685" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="172832224" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3030" name="__module.model.model.decoder.layers.12.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1737,tensor.145"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3031" name="Constant_58053" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3032" name="__module.model.model.decoder.layers.12.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1739"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3033" name="__module.model.model.decoder.layers.12.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3034" name="__module.model.model.decoder.layers.12.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1740"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3035" name="Constant_60745" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3036" name="Constant_60738" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3037" name="Constant_60740" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3038" name="Constant_60742" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3039" name="Concat_60743" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3040" name="Broadcast_60746" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3041" name="ReadValue_59957" type="ReadValue" version="opset6"> <data variable_id="past_key_values.12.decoder.keypresent.12.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.12.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3042" name="Constant_59488" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3043" name="Gather_59489" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3044" name="self.model.model.decoder.layers.12.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="172836320" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3045" name="Convert_1440195" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3046" name="self.model.model.decoder.layers.12.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="173360608" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3047" name="Convert_1440198" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3048" name="self.model.model.decoder.layers.12.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3049" name="self.model.model.decoder.layers.12.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="173364704" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3050" name="self.model.model.decoder.layers.12.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3051" name="Constant_1440203" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3052" name="Reshape_1440204" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3053" name="self.model.model.decoder.layers.12.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3054" name="__module.model.model.decoder.layers.12.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1743,tensor.147"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3055" name="Constant_58054" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3056" name="__module.model.model.decoder.layers.12.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1745"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3057" name="__module.model.model.decoder.layers.12.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3058" name="__module.model.model.decoder.layers.12.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1746"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3059" name="__module.model.model.decoder.layers.12.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.33"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3060" name="Constant_60733" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3061" name="Constant_60726" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3062" name="Constant_60728" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3063" name="Constant_60730" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3064" name="Concat_60731" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3065" name="Broadcast_60734" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3066" name="ReadValue_59959" type="ReadValue" version="opset6"> <data variable_id="past_key_values.12.decoder.valuepresent.12.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.12.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3067" name="Constant_59491" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3068" name="Gather_59492" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3069" name="self.model.model.decoder.layers.12.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="173381088" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3070" name="Convert_1435896" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3071" name="self.model.model.decoder.layers.12.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="173905376" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3072" name="Convert_1435899" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3073" name="self.model.model.decoder.layers.12.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3074" name="self.model.model.decoder.layers.12.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="173909472" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3075" name="self.model.model.decoder.layers.12.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3076" name="Constant_1435904" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3077" name="Reshape_1435905" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3078" name="self.model.model.decoder.layers.12.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3079" name="__module.model.model.decoder.layers.12.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3080" name="Constant_54686" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="173925856" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3081" name="__module.model.model.decoder.layers.12.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1750,tensor.149"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3082" name="Constant_58055" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3083" name="__module.model.model.decoder.layers.12.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1752"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3084" name="__module.model.model.decoder.layers.12.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3085" name="__module.model.model.decoder.layers.12.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1753"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3086" name="__module.model.model.decoder.layers.12.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3087" name="__module.model.model.decoder.layers.12.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1764,attn_output.97"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3088" name="__module.model.model.decoder.layers.12.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3089" name="__module.model.model.decoder.layers.12.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1765,attn_output.99"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3090" name="Constant_58056" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3091" name="__module.model.model.decoder.layers.12.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1767"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3092" name="self.model.model.decoder.layers.12.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="173929952" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3093" name="Convert_1448793" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3094" name="self.model.model.decoder.layers.12.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="174454240" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3095" name="Convert_1448796" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3096" name="self.model.model.decoder.layers.12.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3097" name="self.model.model.decoder.layers.12.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="174458336" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3098" name="self.model.model.decoder.layers.12.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3099" name="Constant_1448801" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3100" name="Reshape_1448802" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3101" name="self.model.model.decoder.layers.12.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3102" name="__module.model.model.decoder.layers.12.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3103" name="Constant_54687" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="174474720" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3104" name="__module.model.model.decoder.layers.12.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1770,1772,input.99"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3105" name="__module.model.model.decoder.layers.12/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1776,residual.75"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3106" name="__module.model.model.decoder.layers.12.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3107" name="__module.model.model.decoder.layers.12.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3108" name="Constant_54688" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="174478816" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3109" name="__module.model.model.decoder.layers.12.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3110" name="Constant_54689" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="174482912" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3111" name="__module.model.model.decoder.layers.12.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1780,hidden_states.125"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3112" name="self.model.model.decoder.layers.12.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="174487008" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3113" name="Convert_1453092" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3114" name="self.model.model.decoder.layers.12.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="175011296" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3115" name="Convert_1453095" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3116" name="self.model.model.decoder.layers.12.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3117" name="self.model.model.decoder.layers.12.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="175015392" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3118" name="self.model.model.decoder.layers.12.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3119" name="Constant_1453100" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3120" name="Reshape_1453101" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3121" name="self.model.model.decoder.layers.12.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3122" name="__module.model.model.decoder.layers.12.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3123" name="Constant_54690" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="175031776" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3124" name="__module.model.model.decoder.layers.12.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1789,tensor.151"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3125" name="Constant_58057" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3126" name="__module.model.model.decoder.layers.12.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1791"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3127" name="__module.model.model.decoder.layers.12.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3128" name="__module.model.model.decoder.layers.12.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1792"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3129" name="__module.model.model.decoder.layers.12.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="1807,attn_output.101"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3130" name="__module.model.model.decoder.layers.12.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3131" name="__module.model.model.decoder.layers.12.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1808,attn_output.103"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3132" name="Constant_58060" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3133" name="__module.model.model.decoder.layers.12.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1810"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3134" name="self.model.model.decoder.layers.12.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="175035872" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3135" name="Convert_1457391" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3136" name="self.model.model.decoder.layers.12.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="175560160" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3137" name="Convert_1457394" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3138" name="self.model.model.decoder.layers.12.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3139" name="self.model.model.decoder.layers.12.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="175564256" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3140" name="self.model.model.decoder.layers.12.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3141" name="Constant_1457399" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3142" name="Reshape_1457400" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3143" name="self.model.model.decoder.layers.12.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3144" name="__module.model.model.decoder.layers.12.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3145" name="Constant_54692" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="175580640" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3146" name="__module.model.model.decoder.layers.12.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1813,input.101"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3147" name="__module.model.model.decoder.layers.12/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1815,residual.77"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3148" name="__module.model.model.decoder.layers.12.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3149" name="__module.model.model.decoder.layers.12.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3150" name="Constant_54693" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="175584736" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3151" name="__module.model.model.decoder.layers.12.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3152" name="Constant_54694" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="175588832" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3153" name="__module.model.model.decoder.layers.12.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1819"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3154" name="self.model.model.decoder.layers.12.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="175592928" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3155" name="Convert_816840" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3156" name="self.model.model.decoder.layers.12.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="177690080" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3157" name="Convert_816843" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3158" name="self.model.model.decoder.layers.12.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3159" name="self.model.model.decoder.layers.12.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="177706464" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3160" name="self.model.model.decoder.layers.12.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3161" name="Constant_816848" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3162" name="Reshape_816849" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3163" name="self.model.model.decoder.layers.12.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3164" name="__module.model.model.decoder.layers.12.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3165" name="Constant_54695" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="177772000" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3166" name="__module.model.model.decoder.layers.12.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="1822"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3167" name="__module.model.model.decoder.layers.12.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="1823,input.103"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3168" name="self.model.model.decoder.layers.12.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="177788384" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3169" name="Convert_821139" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3170" name="self.model.model.decoder.layers.12.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="179885536" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3171" name="Convert_821142" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3172" name="self.model.model.decoder.layers.12.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3173" name="self.model.model.decoder.layers.12.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="179901920" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3174" name="self.model.model.decoder.layers.12.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3175" name="Constant_821147" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3176" name="Reshape_821148" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3177" name="self.model.model.decoder.layers.12.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3178" name="__module.model.model.decoder.layers.12.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3179" name="Constant_54696" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="179967456" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3180" name="__module.model.model.decoder.layers.12.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1827,input.105"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3181" name="__module.model.model.decoder.layers.12/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1829,1831,residual.79"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3182" name="__module.model.model.decoder.layers.13.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3183" name="__module.model.model.decoder.layers.13.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3184" name="Constant_54697" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="179971552" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3185" name="__module.model.model.decoder.layers.13.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3186" name="Constant_54698" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="179975648" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3187" name="__module.model.model.decoder.layers.13.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1844,hidden_states.131"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3188" name="self.model.model.decoder.layers.13.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="179979744" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3189" name="Convert_1470288" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3190" name="self.model.model.decoder.layers.13.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="180504032" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3191" name="Convert_1470291" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3192" name="self.model.model.decoder.layers.13.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3193" name="self.model.model.decoder.layers.13.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="180508128" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3194" name="self.model.model.decoder.layers.13.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3195" name="Constant_1470296" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3196" name="Reshape_1470297" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3197" name="self.model.model.decoder.layers.13.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3198" name="__module.model.model.decoder.layers.13.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3199" name="Constant_54699" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="180524512" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3200" name="__module.model.model.decoder.layers.13.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1853,tensor.157"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3201" name="Constant_58061" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3202" name="__module.model.model.decoder.layers.13.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1855"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3203" name="__module.model.model.decoder.layers.13.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3204" name="__module.model.model.decoder.layers.13.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1856"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3205" name="Constant_60769" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3206" name="Constant_60762" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3207" name="Constant_60764" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3208" name="Constant_60766" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3209" name="Concat_60767" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3210" name="Broadcast_60770" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3211" name="ReadValue_59961" type="ReadValue" version="opset6"> <data variable_id="past_key_values.13.decoder.keypresent.13.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.13.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3212" name="Constant_59494" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3213" name="Gather_59495" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3214" name="self.model.model.decoder.layers.13.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="180528608" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3215" name="Convert_1465989" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3216" name="self.model.model.decoder.layers.13.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="181052896" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3217" name="Convert_1465992" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3218" name="self.model.model.decoder.layers.13.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3219" name="self.model.model.decoder.layers.13.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="181056992" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3220" name="self.model.model.decoder.layers.13.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3221" name="Constant_1465997" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3222" name="Reshape_1465998" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3223" name="self.model.model.decoder.layers.13.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3224" name="__module.model.model.decoder.layers.13.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1859,tensor.159"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3225" name="Constant_58062" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3226" name="__module.model.model.decoder.layers.13.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1861"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3227" name="__module.model.model.decoder.layers.13.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3228" name="__module.model.model.decoder.layers.13.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1862"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3229" name="__module.model.model.decoder.layers.13.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.35"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3230" name="Constant_60757" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3231" name="Constant_60750" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3232" name="Constant_60752" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3233" name="Constant_60754" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3234" name="Concat_60755" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3235" name="Broadcast_60758" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3236" name="ReadValue_59963" type="ReadValue" version="opset6"> <data variable_id="past_key_values.13.decoder.valuepresent.13.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.13.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3237" name="Constant_59497" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3238" name="Gather_59498" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3239" name="self.model.model.decoder.layers.13.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="181073376" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3240" name="Convert_1461690" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3241" name="self.model.model.decoder.layers.13.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="181597664" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3242" name="Convert_1461693" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3243" name="self.model.model.decoder.layers.13.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3244" name="self.model.model.decoder.layers.13.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="181601760" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3245" name="self.model.model.decoder.layers.13.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3246" name="Constant_1461698" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3247" name="Reshape_1461699" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3248" name="self.model.model.decoder.layers.13.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3249" name="__module.model.model.decoder.layers.13.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3250" name="Constant_54700" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="181618144" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3251" name="__module.model.model.decoder.layers.13.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1866,tensor.161"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3252" name="Constant_58063" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3253" name="__module.model.model.decoder.layers.13.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1868"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3254" name="__module.model.model.decoder.layers.13.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3255" name="__module.model.model.decoder.layers.13.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1869"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3256" name="__module.model.model.decoder.layers.13.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3257" name="__module.model.model.decoder.layers.13.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1880,attn_output.105"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3258" name="__module.model.model.decoder.layers.13.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3259" name="__module.model.model.decoder.layers.13.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1881,attn_output.107"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3260" name="Constant_58064" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3261" name="__module.model.model.decoder.layers.13.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1883"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3262" name="self.model.model.decoder.layers.13.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="181622240" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3263" name="Convert_1474587" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3264" name="self.model.model.decoder.layers.13.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="182146528" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3265" name="Convert_1474590" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3266" name="self.model.model.decoder.layers.13.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3267" name="self.model.model.decoder.layers.13.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="182150624" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3268" name="self.model.model.decoder.layers.13.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3269" name="Constant_1474595" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3270" name="Reshape_1474596" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3271" name="self.model.model.decoder.layers.13.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3272" name="__module.model.model.decoder.layers.13.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3273" name="Constant_54701" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="182167008" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3274" name="__module.model.model.decoder.layers.13.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1886,1888,input.107"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3275" name="__module.model.model.decoder.layers.13/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1892,residual.81"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3276" name="__module.model.model.decoder.layers.13.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3277" name="__module.model.model.decoder.layers.13.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3278" name="Constant_54702" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="182171104" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3279" name="__module.model.model.decoder.layers.13.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3280" name="Constant_54703" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="182175200" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3281" name="__module.model.model.decoder.layers.13.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1896,hidden_states.135"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3282" name="self.model.model.decoder.layers.13.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="182179296" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3283" name="Convert_1478886" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3284" name="self.model.model.decoder.layers.13.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="182703584" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3285" name="Convert_1478889" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3286" name="self.model.model.decoder.layers.13.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3287" name="self.model.model.decoder.layers.13.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="182707680" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3288" name="self.model.model.decoder.layers.13.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3289" name="Constant_1478894" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3290" name="Reshape_1478895" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3291" name="self.model.model.decoder.layers.13.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3292" name="__module.model.model.decoder.layers.13.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3293" name="Constant_54704" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="182724064" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3294" name="__module.model.model.decoder.layers.13.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1905,tensor.163"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3295" name="Constant_58065" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3296" name="__module.model.model.decoder.layers.13.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1907"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3297" name="__module.model.model.decoder.layers.13.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3298" name="__module.model.model.decoder.layers.13.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1908"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3299" name="__module.model.model.decoder.layers.13.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="1923,attn_output.109"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3300" name="__module.model.model.decoder.layers.13.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3301" name="__module.model.model.decoder.layers.13.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1924,attn_output.111"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3302" name="Constant_58068" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3303" name="__module.model.model.decoder.layers.13.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1926"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3304" name="self.model.model.decoder.layers.13.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="182728160" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3305" name="Convert_1483185" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3306" name="self.model.model.decoder.layers.13.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="183252448" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3307" name="Convert_1483188" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3308" name="self.model.model.decoder.layers.13.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3309" name="self.model.model.decoder.layers.13.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="183256544" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3310" name="self.model.model.decoder.layers.13.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3311" name="Constant_1483193" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3312" name="Reshape_1483194" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3313" name="self.model.model.decoder.layers.13.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3314" name="__module.model.model.decoder.layers.13.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3315" name="Constant_54706" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="183272928" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3316" name="__module.model.model.decoder.layers.13.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1929,input.109"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3317" name="__module.model.model.decoder.layers.13/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1931,residual.83"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3318" name="__module.model.model.decoder.layers.13.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3319" name="__module.model.model.decoder.layers.13.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3320" name="Constant_54707" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="183277024" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3321" name="__module.model.model.decoder.layers.13.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3322" name="Constant_54708" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="183281120" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3323" name="__module.model.model.decoder.layers.13.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1935"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3324" name="self.model.model.decoder.layers.13.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="183285216" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3325" name="Convert_825438" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3326" name="self.model.model.decoder.layers.13.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="185382368" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3327" name="Convert_825441" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3328" name="self.model.model.decoder.layers.13.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3329" name="self.model.model.decoder.layers.13.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="185398752" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3330" name="self.model.model.decoder.layers.13.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3331" name="Constant_825446" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3332" name="Reshape_825447" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3333" name="self.model.model.decoder.layers.13.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3334" name="__module.model.model.decoder.layers.13.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3335" name="Constant_54709" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="185464288" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3336" name="__module.model.model.decoder.layers.13.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="1938"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3337" name="__module.model.model.decoder.layers.13.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="1939,input.111"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3338" name="self.model.model.decoder.layers.13.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="185480672" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3339" name="Convert_829737" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3340" name="self.model.model.decoder.layers.13.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="187577824" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3341" name="Convert_829740" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3342" name="self.model.model.decoder.layers.13.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3343" name="self.model.model.decoder.layers.13.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="187594208" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3344" name="self.model.model.decoder.layers.13.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3345" name="Constant_829745" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3346" name="Reshape_829746" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3347" name="self.model.model.decoder.layers.13.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3348" name="__module.model.model.decoder.layers.13.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3349" name="Constant_54710" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="187659744" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3350" name="__module.model.model.decoder.layers.13.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1943,input.113"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3351" name="__module.model.model.decoder.layers.13/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1945,1947,residual.85"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3352" name="__module.model.model.decoder.layers.14.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3353" name="__module.model.model.decoder.layers.14.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3354" name="Constant_54711" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="187663840" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3355" name="__module.model.model.decoder.layers.14.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3356" name="Constant_54712" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="187667936" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3357" name="__module.model.model.decoder.layers.14.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1960,hidden_states.141"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3358" name="self.model.model.decoder.layers.14.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="187672032" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3359" name="Convert_1496082" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3360" name="self.model.model.decoder.layers.14.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="188196320" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3361" name="Convert_1496085" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3362" name="self.model.model.decoder.layers.14.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3363" name="self.model.model.decoder.layers.14.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="188200416" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3364" name="self.model.model.decoder.layers.14.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3365" name="Constant_1496090" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3366" name="Reshape_1496091" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3367" name="self.model.model.decoder.layers.14.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3368" name="__module.model.model.decoder.layers.14.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3369" name="Constant_54713" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="188216800" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3370" name="__module.model.model.decoder.layers.14.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1969,tensor.169"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3371" name="Constant_58069" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3372" name="__module.model.model.decoder.layers.14.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1971"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3373" name="__module.model.model.decoder.layers.14.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3374" name="__module.model.model.decoder.layers.14.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1972"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3375" name="Constant_60793" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3376" name="Constant_60786" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3377" name="Constant_60788" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3378" name="Constant_60790" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3379" name="Concat_60791" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3380" name="Broadcast_60794" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3381" name="ReadValue_59965" type="ReadValue" version="opset6"> <data variable_id="past_key_values.14.decoder.keypresent.14.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.14.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3382" name="Constant_59500" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3383" name="Gather_59501" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3384" name="self.model.model.decoder.layers.14.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="188220896" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3385" name="Convert_1491783" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3386" name="self.model.model.decoder.layers.14.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="188745184" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3387" name="Convert_1491786" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3388" name="self.model.model.decoder.layers.14.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3389" name="self.model.model.decoder.layers.14.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="188749280" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3390" name="self.model.model.decoder.layers.14.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3391" name="Constant_1491791" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3392" name="Reshape_1491792" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3393" name="self.model.model.decoder.layers.14.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3394" name="__module.model.model.decoder.layers.14.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1975,tensor.171"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3395" name="Constant_58070" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3396" name="__module.model.model.decoder.layers.14.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1977"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3397" name="__module.model.model.decoder.layers.14.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3398" name="__module.model.model.decoder.layers.14.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1978"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3399" name="__module.model.model.decoder.layers.14.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.37"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3400" name="Constant_60781" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3401" name="Constant_60774" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3402" name="Constant_60776" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3403" name="Constant_60778" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3404" name="Concat_60779" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3405" name="Broadcast_60782" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3406" name="ReadValue_59967" type="ReadValue" version="opset6"> <data variable_id="past_key_values.14.decoder.valuepresent.14.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.14.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3407" name="Constant_59503" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3408" name="Gather_59504" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3409" name="self.model.model.decoder.layers.14.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="188765664" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3410" name="Convert_1487484" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3411" name="self.model.model.decoder.layers.14.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="189289952" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3412" name="Convert_1487487" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3413" name="self.model.model.decoder.layers.14.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3414" name="self.model.model.decoder.layers.14.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="189294048" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3415" name="self.model.model.decoder.layers.14.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3416" name="Constant_1487492" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3417" name="Reshape_1487493" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3418" name="self.model.model.decoder.layers.14.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3419" name="__module.model.model.decoder.layers.14.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3420" name="Constant_54714" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="189310432" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3421" name="__module.model.model.decoder.layers.14.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="1982,tensor.173"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3422" name="Constant_58071" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3423" name="__module.model.model.decoder.layers.14.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1984"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3424" name="__module.model.model.decoder.layers.14.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3425" name="__module.model.model.decoder.layers.14.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1985"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3426" name="__module.model.model.decoder.layers.14.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3427" name="__module.model.model.decoder.layers.14.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1996,attn_output.113"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3428" name="__module.model.model.decoder.layers.14.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3429" name="__module.model.model.decoder.layers.14.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1997,attn_output.115"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3430" name="Constant_58072" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3431" name="__module.model.model.decoder.layers.14.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1999"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3432" name="self.model.model.decoder.layers.14.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="189314528" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3433" name="Convert_1500381" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3434" name="self.model.model.decoder.layers.14.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="189838816" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3435" name="Convert_1500384" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3436" name="self.model.model.decoder.layers.14.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3437" name="self.model.model.decoder.layers.14.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="189842912" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3438" name="self.model.model.decoder.layers.14.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3439" name="Constant_1500389" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3440" name="Reshape_1500390" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3441" name="self.model.model.decoder.layers.14.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3442" name="__module.model.model.decoder.layers.14.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3443" name="Constant_54715" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="189859296" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3444" name="__module.model.model.decoder.layers.14.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2002,2004,input.115"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3445" name="__module.model.model.decoder.layers.14/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2008,residual.87"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3446" name="__module.model.model.decoder.layers.14.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3447" name="__module.model.model.decoder.layers.14.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3448" name="Constant_54716" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="189863392" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3449" name="__module.model.model.decoder.layers.14.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3450" name="Constant_54717" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="189867488" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3451" name="__module.model.model.decoder.layers.14.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2012,hidden_states.145"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3452" name="self.model.model.decoder.layers.14.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="189871584" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3453" name="Convert_1504680" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3454" name="self.model.model.decoder.layers.14.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="190395872" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3455" name="Convert_1504683" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3456" name="self.model.model.decoder.layers.14.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3457" name="self.model.model.decoder.layers.14.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="190399968" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3458" name="self.model.model.decoder.layers.14.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3459" name="Constant_1504688" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3460" name="Reshape_1504689" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3461" name="self.model.model.decoder.layers.14.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3462" name="__module.model.model.decoder.layers.14.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3463" name="Constant_54718" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="190416352" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3464" name="__module.model.model.decoder.layers.14.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2021,tensor.175"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3465" name="Constant_58073" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3466" name="__module.model.model.decoder.layers.14.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2023"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3467" name="__module.model.model.decoder.layers.14.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3468" name="__module.model.model.decoder.layers.14.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2024"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3469" name="__module.model.model.decoder.layers.14.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="2039,attn_output.117"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3470" name="__module.model.model.decoder.layers.14.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3471" name="__module.model.model.decoder.layers.14.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2040,attn_output.119"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3472" name="Constant_58076" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3473" name="__module.model.model.decoder.layers.14.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2042"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3474" name="self.model.model.decoder.layers.14.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="190420448" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3475" name="Convert_1508979" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3476" name="self.model.model.decoder.layers.14.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="190944736" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3477" name="Convert_1508982" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3478" name="self.model.model.decoder.layers.14.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3479" name="self.model.model.decoder.layers.14.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="190948832" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3480" name="self.model.model.decoder.layers.14.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3481" name="Constant_1508987" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3482" name="Reshape_1508988" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3483" name="self.model.model.decoder.layers.14.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3484" name="__module.model.model.decoder.layers.14.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3485" name="Constant_54720" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="190965216" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3486" name="__module.model.model.decoder.layers.14.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2045,input.117"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3487" name="__module.model.model.decoder.layers.14/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2047,residual.89"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3488" name="__module.model.model.decoder.layers.14.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3489" name="__module.model.model.decoder.layers.14.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3490" name="Constant_54721" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="190969312" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3491" name="__module.model.model.decoder.layers.14.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3492" name="Constant_54722" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="190973408" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3493" name="__module.model.model.decoder.layers.14.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2051"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3494" name="self.model.model.decoder.layers.14.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="190977504" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3495" name="Convert_834036" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3496" name="self.model.model.decoder.layers.14.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="193074656" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3497" name="Convert_834039" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3498" name="self.model.model.decoder.layers.14.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3499" name="self.model.model.decoder.layers.14.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="193091040" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3500" name="self.model.model.decoder.layers.14.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3501" name="Constant_834044" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3502" name="Reshape_834045" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3503" name="self.model.model.decoder.layers.14.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3504" name="__module.model.model.decoder.layers.14.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3505" name="Constant_54723" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="193156576" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3506" name="__module.model.model.decoder.layers.14.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="2054"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3507" name="__module.model.model.decoder.layers.14.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="2055,input.119"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3508" name="self.model.model.decoder.layers.14.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="193172960" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3509" name="Convert_838335" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3510" name="self.model.model.decoder.layers.14.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="195270112" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3511" name="Convert_838338" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3512" name="self.model.model.decoder.layers.14.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3513" name="self.model.model.decoder.layers.14.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="195286496" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3514" name="self.model.model.decoder.layers.14.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3515" name="Constant_838343" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3516" name="Reshape_838344" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3517" name="self.model.model.decoder.layers.14.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3518" name="__module.model.model.decoder.layers.14.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3519" name="Constant_54724" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="195352032" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3520" name="__module.model.model.decoder.layers.14.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2059,input.121"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3521" name="__module.model.model.decoder.layers.14/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2061,2063,residual.91"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3522" name="__module.model.model.decoder.layers.15.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3523" name="__module.model.model.decoder.layers.15.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3524" name="Constant_54725" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="195356128" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3525" name="__module.model.model.decoder.layers.15.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3526" name="Constant_54726" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="195360224" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3527" name="__module.model.model.decoder.layers.15.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2076,hidden_states.151"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3528" name="self.model.model.decoder.layers.15.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="195364320" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3529" name="Convert_1521876" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3530" name="self.model.model.decoder.layers.15.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="195888608" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3531" name="Convert_1521879" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3532" name="self.model.model.decoder.layers.15.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3533" name="self.model.model.decoder.layers.15.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="195892704" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3534" name="self.model.model.decoder.layers.15.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3535" name="Constant_1521884" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3536" name="Reshape_1521885" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3537" name="self.model.model.decoder.layers.15.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3538" name="__module.model.model.decoder.layers.15.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3539" name="Constant_54727" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="195909088" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3540" name="__module.model.model.decoder.layers.15.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2085,tensor.181"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3541" name="Constant_58077" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3542" name="__module.model.model.decoder.layers.15.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2087"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3543" name="__module.model.model.decoder.layers.15.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3544" name="__module.model.model.decoder.layers.15.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2088"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3545" name="Constant_60817" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3546" name="Constant_60810" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3547" name="Constant_60812" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3548" name="Constant_60814" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3549" name="Concat_60815" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3550" name="Broadcast_60818" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3551" name="ReadValue_59969" type="ReadValue" version="opset6"> <data variable_id="past_key_values.15.decoder.keypresent.15.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.15.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3552" name="Constant_59506" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3553" name="Gather_59507" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3554" name="self.model.model.decoder.layers.15.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="195913184" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3555" name="Convert_1517577" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3556" name="self.model.model.decoder.layers.15.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="196437472" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3557" name="Convert_1517580" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3558" name="self.model.model.decoder.layers.15.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3559" name="self.model.model.decoder.layers.15.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="196441568" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3560" name="self.model.model.decoder.layers.15.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3561" name="Constant_1517585" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3562" name="Reshape_1517586" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3563" name="self.model.model.decoder.layers.15.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3564" name="__module.model.model.decoder.layers.15.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2091,tensor.183"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3565" name="Constant_58078" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3566" name="__module.model.model.decoder.layers.15.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2093"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3567" name="__module.model.model.decoder.layers.15.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3568" name="__module.model.model.decoder.layers.15.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2094"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3569" name="__module.model.model.decoder.layers.15.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.39"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3570" name="Constant_60805" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3571" name="Constant_60798" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3572" name="Constant_60800" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3573" name="Constant_60802" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3574" name="Concat_60803" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3575" name="Broadcast_60806" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3576" name="ReadValue_59971" type="ReadValue" version="opset6"> <data variable_id="past_key_values.15.decoder.valuepresent.15.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.15.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3577" name="Constant_59509" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3578" name="Gather_59510" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3579" name="self.model.model.decoder.layers.15.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="196457952" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3580" name="Convert_1513278" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3581" name="self.model.model.decoder.layers.15.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="196982240" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3582" name="Convert_1513281" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3583" name="self.model.model.decoder.layers.15.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3584" name="self.model.model.decoder.layers.15.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="196986336" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3585" name="self.model.model.decoder.layers.15.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3586" name="Constant_1513286" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3587" name="Reshape_1513287" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3588" name="self.model.model.decoder.layers.15.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3589" name="__module.model.model.decoder.layers.15.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3590" name="Constant_54728" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="197002720" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3591" name="__module.model.model.decoder.layers.15.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2098,tensor.185"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3592" name="Constant_58079" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3593" name="__module.model.model.decoder.layers.15.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2100"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3594" name="__module.model.model.decoder.layers.15.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3595" name="__module.model.model.decoder.layers.15.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2101"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3596" name="__module.model.model.decoder.layers.15.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3597" name="__module.model.model.decoder.layers.15.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2112,attn_output.121"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3598" name="__module.model.model.decoder.layers.15.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3599" name="__module.model.model.decoder.layers.15.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2113,attn_output.123"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3600" name="Constant_58080" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3601" name="__module.model.model.decoder.layers.15.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2115"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3602" name="self.model.model.decoder.layers.15.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="197006816" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3603" name="Convert_1526175" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3604" name="self.model.model.decoder.layers.15.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="197531104" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3605" name="Convert_1526178" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3606" name="self.model.model.decoder.layers.15.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3607" name="self.model.model.decoder.layers.15.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="197535200" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3608" name="self.model.model.decoder.layers.15.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3609" name="Constant_1526183" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3610" name="Reshape_1526184" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3611" name="self.model.model.decoder.layers.15.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3612" name="__module.model.model.decoder.layers.15.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3613" name="Constant_54729" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="197551584" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3614" name="__module.model.model.decoder.layers.15.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2118,2120,input.123"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3615" name="__module.model.model.decoder.layers.15/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2124,residual.93"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3616" name="__module.model.model.decoder.layers.15.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3617" name="__module.model.model.decoder.layers.15.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3618" name="Constant_54730" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="197555680" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3619" name="__module.model.model.decoder.layers.15.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3620" name="Constant_54731" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="197559776" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3621" name="__module.model.model.decoder.layers.15.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2128,hidden_states.155"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3622" name="self.model.model.decoder.layers.15.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="197563872" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3623" name="Convert_1530474" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3624" name="self.model.model.decoder.layers.15.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="198088160" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3625" name="Convert_1530477" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3626" name="self.model.model.decoder.layers.15.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3627" name="self.model.model.decoder.layers.15.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="198092256" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3628" name="self.model.model.decoder.layers.15.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3629" name="Constant_1530482" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3630" name="Reshape_1530483" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3631" name="self.model.model.decoder.layers.15.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3632" name="__module.model.model.decoder.layers.15.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3633" name="Constant_54732" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="198108640" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3634" name="__module.model.model.decoder.layers.15.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2137,tensor.187"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3635" name="Constant_58081" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3636" name="__module.model.model.decoder.layers.15.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2139"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3637" name="__module.model.model.decoder.layers.15.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3638" name="__module.model.model.decoder.layers.15.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2140"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3639" name="__module.model.model.decoder.layers.15.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="2155,attn_output.125"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3640" name="__module.model.model.decoder.layers.15.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3641" name="__module.model.model.decoder.layers.15.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2156,attn_output.127"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3642" name="Constant_58084" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3643" name="__module.model.model.decoder.layers.15.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2158"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3644" name="self.model.model.decoder.layers.15.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="198112736" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3645" name="Convert_1534773" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3646" name="self.model.model.decoder.layers.15.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="198637024" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3647" name="Convert_1534776" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3648" name="self.model.model.decoder.layers.15.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3649" name="self.model.model.decoder.layers.15.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="198641120" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3650" name="self.model.model.decoder.layers.15.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3651" name="Constant_1534781" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3652" name="Reshape_1534782" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3653" name="self.model.model.decoder.layers.15.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3654" name="__module.model.model.decoder.layers.15.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3655" name="Constant_54734" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="198657504" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3656" name="__module.model.model.decoder.layers.15.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2161,input.125"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3657" name="__module.model.model.decoder.layers.15/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2163,residual.95"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3658" name="__module.model.model.decoder.layers.15.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3659" name="__module.model.model.decoder.layers.15.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3660" name="Constant_54735" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="198661600" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3661" name="__module.model.model.decoder.layers.15.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3662" name="Constant_54736" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="198665696" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3663" name="__module.model.model.decoder.layers.15.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2167"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3664" name="self.model.model.decoder.layers.15.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="198669792" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3665" name="Convert_842634" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3666" name="self.model.model.decoder.layers.15.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="200766944" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3667" name="Convert_842637" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3668" name="self.model.model.decoder.layers.15.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3669" name="self.model.model.decoder.layers.15.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="200783328" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3670" name="self.model.model.decoder.layers.15.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3671" name="Constant_842642" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3672" name="Reshape_842643" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3673" name="self.model.model.decoder.layers.15.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3674" name="__module.model.model.decoder.layers.15.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3675" name="Constant_54737" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="200848864" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3676" name="__module.model.model.decoder.layers.15.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="2170"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3677" name="__module.model.model.decoder.layers.15.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="2171,input.127"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3678" name="self.model.model.decoder.layers.15.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="200865248" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3679" name="Convert_846933" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3680" name="self.model.model.decoder.layers.15.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="202962400" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3681" name="Convert_846936" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3682" name="self.model.model.decoder.layers.15.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3683" name="self.model.model.decoder.layers.15.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="202978784" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3684" name="self.model.model.decoder.layers.15.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3685" name="Constant_846941" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3686" name="Reshape_846942" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3687" name="self.model.model.decoder.layers.15.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3688" name="__module.model.model.decoder.layers.15.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3689" name="Constant_54738" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="203044320" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3690" name="__module.model.model.decoder.layers.15.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2175,input.129"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3691" name="__module.model.model.decoder.layers.15/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2177,2179,residual.97"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3692" name="__module.model.model.decoder.layers.16.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3693" name="__module.model.model.decoder.layers.16.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3694" name="Constant_54739" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="203048416" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3695" name="__module.model.model.decoder.layers.16.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3696" name="Constant_54740" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="203052512" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3697" name="__module.model.model.decoder.layers.16.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2192,hidden_states.161"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3698" name="self.model.model.decoder.layers.16.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="203056608" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3699" name="Convert_1547670" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3700" name="self.model.model.decoder.layers.16.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="203580896" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3701" name="Convert_1547673" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3702" name="self.model.model.decoder.layers.16.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3703" name="self.model.model.decoder.layers.16.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="203584992" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3704" name="self.model.model.decoder.layers.16.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3705" name="Constant_1547678" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3706" name="Reshape_1547679" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3707" name="self.model.model.decoder.layers.16.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3708" name="__module.model.model.decoder.layers.16.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3709" name="Constant_54741" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="203601376" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3710" name="__module.model.model.decoder.layers.16.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2201,tensor.193"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3711" name="Constant_58085" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3712" name="__module.model.model.decoder.layers.16.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2203"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3713" name="__module.model.model.decoder.layers.16.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3714" name="__module.model.model.decoder.layers.16.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2204"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3715" name="Constant_60841" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3716" name="Constant_60834" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3717" name="Constant_60836" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3718" name="Constant_60838" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3719" name="Concat_60839" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3720" name="Broadcast_60842" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3721" name="ReadValue_59973" type="ReadValue" version="opset6"> <data variable_id="past_key_values.16.decoder.keypresent.16.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.16.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3722" name="Constant_59512" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3723" name="Gather_59513" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3724" name="self.model.model.decoder.layers.16.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="203605472" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3725" name="Convert_1543371" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3726" name="self.model.model.decoder.layers.16.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="204129760" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3727" name="Convert_1543374" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3728" name="self.model.model.decoder.layers.16.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3729" name="self.model.model.decoder.layers.16.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="204133856" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3730" name="self.model.model.decoder.layers.16.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3731" name="Constant_1543379" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3732" name="Reshape_1543380" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3733" name="self.model.model.decoder.layers.16.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3734" name="__module.model.model.decoder.layers.16.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2207,tensor.195"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3735" name="Constant_58086" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3736" name="__module.model.model.decoder.layers.16.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2209"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3737" name="__module.model.model.decoder.layers.16.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3738" name="__module.model.model.decoder.layers.16.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2210"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3739" name="__module.model.model.decoder.layers.16.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.41"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3740" name="Constant_60829" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3741" name="Constant_60822" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3742" name="Constant_60824" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3743" name="Constant_60826" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3744" name="Concat_60827" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3745" name="Broadcast_60830" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3746" name="ReadValue_59975" type="ReadValue" version="opset6"> <data variable_id="past_key_values.16.decoder.valuepresent.16.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.16.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3747" name="Constant_59515" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3748" name="Gather_59516" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3749" name="self.model.model.decoder.layers.16.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="204150240" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3750" name="Convert_1539072" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3751" name="self.model.model.decoder.layers.16.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="204674528" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3752" name="Convert_1539075" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3753" name="self.model.model.decoder.layers.16.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3754" name="self.model.model.decoder.layers.16.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="204678624" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3755" name="self.model.model.decoder.layers.16.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3756" name="Constant_1539080" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3757" name="Reshape_1539081" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3758" name="self.model.model.decoder.layers.16.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3759" name="__module.model.model.decoder.layers.16.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3760" name="Constant_54742" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="204695008" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3761" name="__module.model.model.decoder.layers.16.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2214,tensor.197"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3762" name="Constant_58087" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3763" name="__module.model.model.decoder.layers.16.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2216"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3764" name="__module.model.model.decoder.layers.16.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3765" name="__module.model.model.decoder.layers.16.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2217"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3766" name="__module.model.model.decoder.layers.16.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3767" name="__module.model.model.decoder.layers.16.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2228,attn_output.129"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3768" name="__module.model.model.decoder.layers.16.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3769" name="__module.model.model.decoder.layers.16.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2229,attn_output.131"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3770" name="Constant_58088" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3771" name="__module.model.model.decoder.layers.16.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2231"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3772" name="self.model.model.decoder.layers.16.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="204699104" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3773" name="Convert_1551969" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3774" name="self.model.model.decoder.layers.16.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="205223392" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3775" name="Convert_1551972" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3776" name="self.model.model.decoder.layers.16.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3777" name="self.model.model.decoder.layers.16.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="205227488" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3778" name="self.model.model.decoder.layers.16.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3779" name="Constant_1551977" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3780" name="Reshape_1551978" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3781" name="self.model.model.decoder.layers.16.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3782" name="__module.model.model.decoder.layers.16.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3783" name="Constant_54743" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="205243872" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3784" name="__module.model.model.decoder.layers.16.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2234,2236,input.131"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3785" name="__module.model.model.decoder.layers.16/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2240,residual.99"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3786" name="__module.model.model.decoder.layers.16.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3787" name="__module.model.model.decoder.layers.16.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3788" name="Constant_54744" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="205247968" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3789" name="__module.model.model.decoder.layers.16.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3790" name="Constant_54745" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="205252064" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3791" name="__module.model.model.decoder.layers.16.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2244,hidden_states.165"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3792" name="self.model.model.decoder.layers.16.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="205256160" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3793" name="Convert_1556268" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3794" name="self.model.model.decoder.layers.16.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="205780448" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3795" name="Convert_1556271" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3796" name="self.model.model.decoder.layers.16.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3797" name="self.model.model.decoder.layers.16.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="205784544" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3798" name="self.model.model.decoder.layers.16.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3799" name="Constant_1556276" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3800" name="Reshape_1556277" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3801" name="self.model.model.decoder.layers.16.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3802" name="__module.model.model.decoder.layers.16.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3803" name="Constant_54746" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="205800928" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3804" name="__module.model.model.decoder.layers.16.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2253,tensor.199"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3805" name="Constant_58089" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3806" name="__module.model.model.decoder.layers.16.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2255"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3807" name="__module.model.model.decoder.layers.16.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3808" name="__module.model.model.decoder.layers.16.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2256"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3809" name="__module.model.model.decoder.layers.16.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="2271,attn_output.133"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3810" name="__module.model.model.decoder.layers.16.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3811" name="__module.model.model.decoder.layers.16.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2272,attn_output.135"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3812" name="Constant_58092" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3813" name="__module.model.model.decoder.layers.16.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2274"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3814" name="self.model.model.decoder.layers.16.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="205805024" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3815" name="Convert_1560567" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3816" name="self.model.model.decoder.layers.16.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="206329312" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3817" name="Convert_1560570" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3818" name="self.model.model.decoder.layers.16.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3819" name="self.model.model.decoder.layers.16.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="206333408" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3820" name="self.model.model.decoder.layers.16.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3821" name="Constant_1560575" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3822" name="Reshape_1560576" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3823" name="self.model.model.decoder.layers.16.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3824" name="__module.model.model.decoder.layers.16.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3825" name="Constant_54748" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="206349792" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3826" name="__module.model.model.decoder.layers.16.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2277,input.133"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3827" name="__module.model.model.decoder.layers.16/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2279,residual.101"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3828" name="__module.model.model.decoder.layers.16.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3829" name="__module.model.model.decoder.layers.16.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3830" name="Constant_54749" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="206353888" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3831" name="__module.model.model.decoder.layers.16.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3832" name="Constant_54750" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="206357984" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3833" name="__module.model.model.decoder.layers.16.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2283"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3834" name="self.model.model.decoder.layers.16.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="206362080" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3835" name="Convert_851232" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3836" name="self.model.model.decoder.layers.16.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="208459232" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3837" name="Convert_851235" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3838" name="self.model.model.decoder.layers.16.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3839" name="self.model.model.decoder.layers.16.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="208475616" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3840" name="self.model.model.decoder.layers.16.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3841" name="Constant_851240" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3842" name="Reshape_851241" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3843" name="self.model.model.decoder.layers.16.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3844" name="__module.model.model.decoder.layers.16.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3845" name="Constant_54751" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="208541152" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3846" name="__module.model.model.decoder.layers.16.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="2286"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3847" name="__module.model.model.decoder.layers.16.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="2287,input.135"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3848" name="self.model.model.decoder.layers.16.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="208557536" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3849" name="Convert_855531" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3850" name="self.model.model.decoder.layers.16.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="210654688" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3851" name="Convert_855534" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3852" name="self.model.model.decoder.layers.16.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3853" name="self.model.model.decoder.layers.16.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="210671072" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="3854" name="self.model.model.decoder.layers.16.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="3855" name="Constant_855539" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3856" name="Reshape_855540" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3857" name="self.model.model.decoder.layers.16.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="3858" name="__module.model.model.decoder.layers.16.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3859" name="Constant_54752" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="210736608" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3860" name="__module.model.model.decoder.layers.16.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2291,input.137"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3861" name="__module.model.model.decoder.layers.16/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2293,2295,residual.103"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3862" name="__module.model.model.decoder.layers.17.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3863" name="__module.model.model.decoder.layers.17.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3864" name="Constant_54753" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="210740704" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3865" name="__module.model.model.decoder.layers.17.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3866" name="Constant_54754" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="210744800" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3867" name="__module.model.model.decoder.layers.17.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2308,hidden_states.171"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3868" name="self.model.model.decoder.layers.17.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="210748896" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3869" name="Convert_1573464" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3870" name="self.model.model.decoder.layers.17.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="211273184" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3871" name="Convert_1573467" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3872" name="self.model.model.decoder.layers.17.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3873" name="self.model.model.decoder.layers.17.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="211277280" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3874" name="self.model.model.decoder.layers.17.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3875" name="Constant_1573472" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3876" name="Reshape_1573473" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3877" name="self.model.model.decoder.layers.17.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3878" name="__module.model.model.decoder.layers.17.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3879" name="Constant_54755" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="211293664" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3880" name="__module.model.model.decoder.layers.17.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2317,tensor.205"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3881" name="Constant_58093" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3882" name="__module.model.model.decoder.layers.17.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2319"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3883" name="__module.model.model.decoder.layers.17.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3884" name="__module.model.model.decoder.layers.17.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2320"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3885" name="Constant_60865" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3886" name="Constant_60858" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3887" name="Constant_60860" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3888" name="Constant_60862" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3889" name="Concat_60863" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3890" name="Broadcast_60866" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3891" name="ReadValue_59977" type="ReadValue" version="opset6"> <data variable_id="past_key_values.17.decoder.keypresent.17.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.17.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3892" name="Constant_59518" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3893" name="Gather_59519" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3894" name="self.model.model.decoder.layers.17.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="211297760" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3895" name="Convert_1569165" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3896" name="self.model.model.decoder.layers.17.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="211822048" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3897" name="Convert_1569168" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3898" name="self.model.model.decoder.layers.17.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3899" name="self.model.model.decoder.layers.17.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="211826144" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3900" name="self.model.model.decoder.layers.17.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3901" name="Constant_1569173" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3902" name="Reshape_1569174" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3903" name="self.model.model.decoder.layers.17.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3904" name="__module.model.model.decoder.layers.17.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2323,tensor.207"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3905" name="Constant_58094" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3906" name="__module.model.model.decoder.layers.17.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2325"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3907" name="__module.model.model.decoder.layers.17.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3908" name="__module.model.model.decoder.layers.17.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2326"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3909" name="__module.model.model.decoder.layers.17.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.43"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3910" name="Constant_60853" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="3911" name="Constant_60846" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3912" name="Constant_60848" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3913" name="Constant_60850" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3914" name="Concat_60851" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3915" name="Broadcast_60854" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="3916" name="ReadValue_59979" type="ReadValue" version="opset6"> <data variable_id="past_key_values.17.decoder.valuepresent.17.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.17.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3917" name="Constant_59521" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3918" name="Gather_59522" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3919" name="self.model.model.decoder.layers.17.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="211842528" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3920" name="Convert_1564866" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3921" name="self.model.model.decoder.layers.17.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="212366816" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3922" name="Convert_1564869" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3923" name="self.model.model.decoder.layers.17.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3924" name="self.model.model.decoder.layers.17.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="212370912" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3925" name="self.model.model.decoder.layers.17.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3926" name="Constant_1564874" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3927" name="Reshape_1564875" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3928" name="self.model.model.decoder.layers.17.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3929" name="__module.model.model.decoder.layers.17.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3930" name="Constant_54756" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="212387296" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3931" name="__module.model.model.decoder.layers.17.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2330,tensor.209"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3932" name="Constant_58095" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3933" name="__module.model.model.decoder.layers.17.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2332"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3934" name="__module.model.model.decoder.layers.17.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3935" name="__module.model.model.decoder.layers.17.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2333"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3936" name="__module.model.model.decoder.layers.17.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3937" name="__module.model.model.decoder.layers.17.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2344,attn_output.137"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3938" name="__module.model.model.decoder.layers.17.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3939" name="__module.model.model.decoder.layers.17.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2345,attn_output.139"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3940" name="Constant_58096" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3941" name="__module.model.model.decoder.layers.17.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2347"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3942" name="self.model.model.decoder.layers.17.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="212391392" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3943" name="Convert_1577763" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3944" name="self.model.model.decoder.layers.17.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="212915680" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3945" name="Convert_1577766" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3946" name="self.model.model.decoder.layers.17.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3947" name="self.model.model.decoder.layers.17.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="212919776" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3948" name="self.model.model.decoder.layers.17.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3949" name="Constant_1577771" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3950" name="Reshape_1577772" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3951" name="self.model.model.decoder.layers.17.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3952" name="__module.model.model.decoder.layers.17.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3953" name="Constant_54757" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="212936160" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3954" name="__module.model.model.decoder.layers.17.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2350,2352,input.139"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3955" name="__module.model.model.decoder.layers.17/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2356,residual.105"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3956" name="__module.model.model.decoder.layers.17.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3957" name="__module.model.model.decoder.layers.17.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3958" name="Constant_54758" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="212940256" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3959" name="__module.model.model.decoder.layers.17.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3960" name="Constant_54759" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="212944352" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3961" name="__module.model.model.decoder.layers.17.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2360,hidden_states.175"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3962" name="self.model.model.decoder.layers.17.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="212948448" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3963" name="Convert_1582062" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3964" name="self.model.model.decoder.layers.17.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="213472736" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3965" name="Convert_1582065" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3966" name="self.model.model.decoder.layers.17.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3967" name="self.model.model.decoder.layers.17.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="213476832" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3968" name="self.model.model.decoder.layers.17.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3969" name="Constant_1582070" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3970" name="Reshape_1582071" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3971" name="self.model.model.decoder.layers.17.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3972" name="__module.model.model.decoder.layers.17.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3973" name="Constant_54760" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="213493216" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3974" name="__module.model.model.decoder.layers.17.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2369,tensor.211"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3975" name="Constant_58097" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3976" name="__module.model.model.decoder.layers.17.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2371"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3977" name="__module.model.model.decoder.layers.17.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3978" name="__module.model.model.decoder.layers.17.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2372"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3979" name="__module.model.model.decoder.layers.17.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="2387,attn_output.141"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="3980" name="__module.model.model.decoder.layers.17.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3981" name="__module.model.model.decoder.layers.17.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2388,attn_output.143"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="3982" name="Constant_58100" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3983" name="__module.model.model.decoder.layers.17.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2390"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3984" name="self.model.model.decoder.layers.17.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="213497312" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3985" name="Convert_1586361" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3986" name="self.model.model.decoder.layers.17.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="214021600" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3987" name="Convert_1586364" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3988" name="self.model.model.decoder.layers.17.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3989" name="self.model.model.decoder.layers.17.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="214025696" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="3990" name="self.model.model.decoder.layers.17.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="3991" name="Constant_1586369" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="3992" name="Reshape_1586370" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3993" name="self.model.model.decoder.layers.17.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3994" name="__module.model.model.decoder.layers.17.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3995" name="Constant_54762" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="214042080" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3996" name="__module.model.model.decoder.layers.17.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2393,input.141"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3997" name="__module.model.model.decoder.layers.17/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2395,residual.107"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="3998" name="__module.model.model.decoder.layers.17.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="3999" name="__module.model.model.decoder.layers.17.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4000" name="Constant_54763" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="214046176" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4001" name="__module.model.model.decoder.layers.17.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4002" name="Constant_54764" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="214050272" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4003" name="__module.model.model.decoder.layers.17.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2399"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4004" name="self.model.model.decoder.layers.17.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="214054368" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4005" name="Convert_859830" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4006" name="self.model.model.decoder.layers.17.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="216151520" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4007" name="Convert_859833" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4008" name="self.model.model.decoder.layers.17.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4009" name="self.model.model.decoder.layers.17.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="216167904" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4010" name="self.model.model.decoder.layers.17.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4011" name="Constant_859838" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4012" name="Reshape_859839" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4013" name="self.model.model.decoder.layers.17.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4014" name="__module.model.model.decoder.layers.17.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4015" name="Constant_54765" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="216233440" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4016" name="__module.model.model.decoder.layers.17.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="2402"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4017" name="__module.model.model.decoder.layers.17.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="2403,input.143"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4018" name="self.model.model.decoder.layers.17.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="216249824" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4019" name="Convert_864129" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4020" name="self.model.model.decoder.layers.17.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="218346976" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4021" name="Convert_864132" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4022" name="self.model.model.decoder.layers.17.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4023" name="self.model.model.decoder.layers.17.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="218363360" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4024" name="self.model.model.decoder.layers.17.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4025" name="Constant_864137" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4026" name="Reshape_864138" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4027" name="self.model.model.decoder.layers.17.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4028" name="__module.model.model.decoder.layers.17.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4029" name="Constant_54766" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="218428896" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4030" name="__module.model.model.decoder.layers.17.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2407,input.145"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4031" name="__module.model.model.decoder.layers.17/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2409,2411,residual.109"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4032" name="__module.model.model.decoder.layers.18.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4033" name="__module.model.model.decoder.layers.18.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4034" name="Constant_54767" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="218432992" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4035" name="__module.model.model.decoder.layers.18.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4036" name="Constant_54768" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="218437088" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4037" name="__module.model.model.decoder.layers.18.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2424,hidden_states.181"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4038" name="self.model.model.decoder.layers.18.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="218441184" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4039" name="Convert_1599258" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4040" name="self.model.model.decoder.layers.18.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="218965472" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4041" name="Convert_1599261" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4042" name="self.model.model.decoder.layers.18.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4043" name="self.model.model.decoder.layers.18.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="218969568" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4044" name="self.model.model.decoder.layers.18.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4045" name="Constant_1599266" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4046" name="Reshape_1599267" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4047" name="self.model.model.decoder.layers.18.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4048" name="__module.model.model.decoder.layers.18.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4049" name="Constant_54769" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="218985952" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4050" name="__module.model.model.decoder.layers.18.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2433,tensor.217"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4051" name="Constant_58101" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4052" name="__module.model.model.decoder.layers.18.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2435"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4053" name="__module.model.model.decoder.layers.18.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4054" name="__module.model.model.decoder.layers.18.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2436"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4055" name="Constant_60889" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4056" name="Constant_60882" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4057" name="Constant_60884" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4058" name="Constant_60886" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4059" name="Concat_60887" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4060" name="Broadcast_60890" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4061" name="ReadValue_59981" type="ReadValue" version="opset6"> <data variable_id="past_key_values.18.decoder.keypresent.18.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.18.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4062" name="Constant_59524" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4063" name="Gather_59525" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4064" name="self.model.model.decoder.layers.18.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="218990048" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4065" name="Convert_1594959" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4066" name="self.model.model.decoder.layers.18.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="219514336" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4067" name="Convert_1594962" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4068" name="self.model.model.decoder.layers.18.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4069" name="self.model.model.decoder.layers.18.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="219518432" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4070" name="self.model.model.decoder.layers.18.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4071" name="Constant_1594967" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4072" name="Reshape_1594968" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4073" name="self.model.model.decoder.layers.18.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4074" name="__module.model.model.decoder.layers.18.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2439,tensor.219"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4075" name="Constant_58102" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4076" name="__module.model.model.decoder.layers.18.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2441"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4077" name="__module.model.model.decoder.layers.18.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4078" name="__module.model.model.decoder.layers.18.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2442"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4079" name="__module.model.model.decoder.layers.18.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.45"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4080" name="Constant_60877" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4081" name="Constant_60870" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4082" name="Constant_60872" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4083" name="Constant_60874" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4084" name="Concat_60875" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4085" name="Broadcast_60878" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4086" name="ReadValue_59983" type="ReadValue" version="opset6"> <data variable_id="past_key_values.18.decoder.valuepresent.18.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.18.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4087" name="Constant_59527" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4088" name="Gather_59528" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4089" name="self.model.model.decoder.layers.18.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="219534816" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4090" name="Convert_1590660" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4091" name="self.model.model.decoder.layers.18.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="220059104" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4092" name="Convert_1590663" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4093" name="self.model.model.decoder.layers.18.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4094" name="self.model.model.decoder.layers.18.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="220063200" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4095" name="self.model.model.decoder.layers.18.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4096" name="Constant_1590668" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4097" name="Reshape_1590669" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4098" name="self.model.model.decoder.layers.18.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4099" name="__module.model.model.decoder.layers.18.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4100" name="Constant_54770" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="220079584" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4101" name="__module.model.model.decoder.layers.18.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2446,tensor.221"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4102" name="Constant_58103" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4103" name="__module.model.model.decoder.layers.18.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2448"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4104" name="__module.model.model.decoder.layers.18.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4105" name="__module.model.model.decoder.layers.18.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2449"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4106" name="__module.model.model.decoder.layers.18.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4107" name="__module.model.model.decoder.layers.18.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2460,attn_output.145"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4108" name="__module.model.model.decoder.layers.18.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4109" name="__module.model.model.decoder.layers.18.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2461,attn_output.147"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4110" name="Constant_58104" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4111" name="__module.model.model.decoder.layers.18.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2463"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4112" name="self.model.model.decoder.layers.18.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="220083680" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4113" name="Convert_1603557" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4114" name="self.model.model.decoder.layers.18.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="220607968" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4115" name="Convert_1603560" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4116" name="self.model.model.decoder.layers.18.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4117" name="self.model.model.decoder.layers.18.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="220612064" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4118" name="self.model.model.decoder.layers.18.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4119" name="Constant_1603565" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4120" name="Reshape_1603566" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4121" name="self.model.model.decoder.layers.18.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4122" name="__module.model.model.decoder.layers.18.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4123" name="Constant_54771" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="220628448" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4124" name="__module.model.model.decoder.layers.18.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2466,2468,input.147"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4125" name="__module.model.model.decoder.layers.18/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2472,residual.111"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4126" name="__module.model.model.decoder.layers.18.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4127" name="__module.model.model.decoder.layers.18.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4128" name="Constant_54772" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="220632544" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4129" name="__module.model.model.decoder.layers.18.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4130" name="Constant_54773" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="220636640" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4131" name="__module.model.model.decoder.layers.18.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2476,hidden_states.185"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4132" name="self.model.model.decoder.layers.18.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="220640736" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4133" name="Convert_1607856" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4134" name="self.model.model.decoder.layers.18.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="221165024" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4135" name="Convert_1607859" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4136" name="self.model.model.decoder.layers.18.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4137" name="self.model.model.decoder.layers.18.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="221169120" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4138" name="self.model.model.decoder.layers.18.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4139" name="Constant_1607864" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4140" name="Reshape_1607865" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4141" name="self.model.model.decoder.layers.18.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4142" name="__module.model.model.decoder.layers.18.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4143" name="Constant_54774" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="221185504" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4144" name="__module.model.model.decoder.layers.18.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2485,tensor.223"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4145" name="Constant_58105" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4146" name="__module.model.model.decoder.layers.18.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2487"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4147" name="__module.model.model.decoder.layers.18.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4148" name="__module.model.model.decoder.layers.18.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2488"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4149" name="__module.model.model.decoder.layers.18.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="2503,attn_output.149"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4150" name="__module.model.model.decoder.layers.18.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4151" name="__module.model.model.decoder.layers.18.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2504,attn_output.151"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4152" name="Constant_58108" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4153" name="__module.model.model.decoder.layers.18.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2506"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4154" name="self.model.model.decoder.layers.18.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="221189600" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4155" name="Convert_1612155" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4156" name="self.model.model.decoder.layers.18.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="221713888" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4157" name="Convert_1612158" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4158" name="self.model.model.decoder.layers.18.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4159" name="self.model.model.decoder.layers.18.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="221717984" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4160" name="self.model.model.decoder.layers.18.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4161" name="Constant_1612163" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4162" name="Reshape_1612164" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4163" name="self.model.model.decoder.layers.18.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4164" name="__module.model.model.decoder.layers.18.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4165" name="Constant_54776" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="221734368" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4166" name="__module.model.model.decoder.layers.18.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2509,input.149"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4167" name="__module.model.model.decoder.layers.18/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2511,residual.113"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4168" name="__module.model.model.decoder.layers.18.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4169" name="__module.model.model.decoder.layers.18.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4170" name="Constant_54777" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="221738464" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4171" name="__module.model.model.decoder.layers.18.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4172" name="Constant_54778" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="221742560" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4173" name="__module.model.model.decoder.layers.18.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2515"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4174" name="self.model.model.decoder.layers.18.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="221746656" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4175" name="Convert_868428" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4176" name="self.model.model.decoder.layers.18.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="223843808" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4177" name="Convert_868431" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4178" name="self.model.model.decoder.layers.18.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4179" name="self.model.model.decoder.layers.18.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="223860192" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4180" name="self.model.model.decoder.layers.18.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4181" name="Constant_868436" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4182" name="Reshape_868437" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4183" name="self.model.model.decoder.layers.18.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4184" name="__module.model.model.decoder.layers.18.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4185" name="Constant_54779" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="223925728" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4186" name="__module.model.model.decoder.layers.18.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="2518"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4187" name="__module.model.model.decoder.layers.18.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="2519,input.151"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4188" name="self.model.model.decoder.layers.18.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="223942112" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4189" name="Convert_872727" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4190" name="self.model.model.decoder.layers.18.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="226039264" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4191" name="Convert_872730" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4192" name="self.model.model.decoder.layers.18.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4193" name="self.model.model.decoder.layers.18.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="226055648" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4194" name="self.model.model.decoder.layers.18.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4195" name="Constant_872735" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4196" name="Reshape_872736" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4197" name="self.model.model.decoder.layers.18.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4198" name="__module.model.model.decoder.layers.18.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4199" name="Constant_54780" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="226121184" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4200" name="__module.model.model.decoder.layers.18.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2523,input.153"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4201" name="__module.model.model.decoder.layers.18/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2525,2527,residual.115"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4202" name="__module.model.model.decoder.layers.19.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4203" name="__module.model.model.decoder.layers.19.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4204" name="Constant_54781" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="226125280" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4205" name="__module.model.model.decoder.layers.19.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4206" name="Constant_54782" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="226129376" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4207" name="__module.model.model.decoder.layers.19.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2540,hidden_states.191"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4208" name="self.model.model.decoder.layers.19.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="226133472" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4209" name="Convert_1625052" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4210" name="self.model.model.decoder.layers.19.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="226657760" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4211" name="Convert_1625055" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4212" name="self.model.model.decoder.layers.19.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4213" name="self.model.model.decoder.layers.19.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="226661856" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4214" name="self.model.model.decoder.layers.19.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4215" name="Constant_1625060" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4216" name="Reshape_1625061" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4217" name="self.model.model.decoder.layers.19.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4218" name="__module.model.model.decoder.layers.19.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4219" name="Constant_54783" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="226678240" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4220" name="__module.model.model.decoder.layers.19.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2549,tensor.229"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4221" name="Constant_58109" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4222" name="__module.model.model.decoder.layers.19.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2551"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4223" name="__module.model.model.decoder.layers.19.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4224" name="__module.model.model.decoder.layers.19.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2552"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4225" name="Constant_60913" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4226" name="Constant_60906" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4227" name="Constant_60908" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4228" name="Constant_60910" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4229" name="Concat_60911" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4230" name="Broadcast_60914" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4231" name="ReadValue_59985" type="ReadValue" version="opset6"> <data variable_id="past_key_values.19.decoder.keypresent.19.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.19.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4232" name="Constant_59530" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4233" name="Gather_59531" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4234" name="self.model.model.decoder.layers.19.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="226682336" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4235" name="Convert_1620753" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4236" name="self.model.model.decoder.layers.19.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="227206624" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4237" name="Convert_1620756" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4238" name="self.model.model.decoder.layers.19.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4239" name="self.model.model.decoder.layers.19.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="227210720" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4240" name="self.model.model.decoder.layers.19.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4241" name="Constant_1620761" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4242" name="Reshape_1620762" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4243" name="self.model.model.decoder.layers.19.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4244" name="__module.model.model.decoder.layers.19.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2555,tensor.231"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4245" name="Constant_58110" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4246" name="__module.model.model.decoder.layers.19.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2557"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4247" name="__module.model.model.decoder.layers.19.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4248" name="__module.model.model.decoder.layers.19.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2558"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4249" name="__module.model.model.decoder.layers.19.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.47"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4250" name="Constant_60901" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4251" name="Constant_60894" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4252" name="Constant_60896" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4253" name="Constant_60898" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4254" name="Concat_60899" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4255" name="Broadcast_60902" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4256" name="ReadValue_59987" type="ReadValue" version="opset6"> <data variable_id="past_key_values.19.decoder.valuepresent.19.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.19.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4257" name="Constant_59533" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4258" name="Gather_59534" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4259" name="self.model.model.decoder.layers.19.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="227227104" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4260" name="Convert_1616454" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4261" name="self.model.model.decoder.layers.19.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="227751392" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4262" name="Convert_1616457" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4263" name="self.model.model.decoder.layers.19.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4264" name="self.model.model.decoder.layers.19.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="227755488" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4265" name="self.model.model.decoder.layers.19.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4266" name="Constant_1616462" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4267" name="Reshape_1616463" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4268" name="self.model.model.decoder.layers.19.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4269" name="__module.model.model.decoder.layers.19.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4270" name="Constant_54784" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="227771872" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4271" name="__module.model.model.decoder.layers.19.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2562,tensor.233"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4272" name="Constant_58111" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4273" name="__module.model.model.decoder.layers.19.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2564"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4274" name="__module.model.model.decoder.layers.19.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4275" name="__module.model.model.decoder.layers.19.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2565"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4276" name="__module.model.model.decoder.layers.19.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4277" name="__module.model.model.decoder.layers.19.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2576,attn_output.153"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4278" name="__module.model.model.decoder.layers.19.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4279" name="__module.model.model.decoder.layers.19.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2577,attn_output.155"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4280" name="Constant_58112" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4281" name="__module.model.model.decoder.layers.19.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2579"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4282" name="self.model.model.decoder.layers.19.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="227775968" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4283" name="Convert_1629351" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4284" name="self.model.model.decoder.layers.19.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="228300256" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4285" name="Convert_1629354" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4286" name="self.model.model.decoder.layers.19.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4287" name="self.model.model.decoder.layers.19.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="228304352" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4288" name="self.model.model.decoder.layers.19.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4289" name="Constant_1629359" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4290" name="Reshape_1629360" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4291" name="self.model.model.decoder.layers.19.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4292" name="__module.model.model.decoder.layers.19.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4293" name="Constant_54785" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="228320736" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4294" name="__module.model.model.decoder.layers.19.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2582,2584,input.155"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4295" name="__module.model.model.decoder.layers.19/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2588,residual.117"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4296" name="__module.model.model.decoder.layers.19.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4297" name="__module.model.model.decoder.layers.19.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4298" name="Constant_54786" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="228324832" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4299" name="__module.model.model.decoder.layers.19.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4300" name="Constant_54787" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="228328928" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4301" name="__module.model.model.decoder.layers.19.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2592,hidden_states.195"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4302" name="self.model.model.decoder.layers.19.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="228333024" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4303" name="Convert_1633650" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4304" name="self.model.model.decoder.layers.19.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="228857312" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4305" name="Convert_1633653" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4306" name="self.model.model.decoder.layers.19.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4307" name="self.model.model.decoder.layers.19.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="228861408" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4308" name="self.model.model.decoder.layers.19.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4309" name="Constant_1633658" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4310" name="Reshape_1633659" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4311" name="self.model.model.decoder.layers.19.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4312" name="__module.model.model.decoder.layers.19.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4313" name="Constant_54788" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="228877792" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4314" name="__module.model.model.decoder.layers.19.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2601,tensor.235"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4315" name="Constant_58113" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4316" name="__module.model.model.decoder.layers.19.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2603"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4317" name="__module.model.model.decoder.layers.19.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4318" name="__module.model.model.decoder.layers.19.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2604"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4319" name="__module.model.model.decoder.layers.19.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="2619,attn_output.157"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4320" name="__module.model.model.decoder.layers.19.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4321" name="__module.model.model.decoder.layers.19.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2620,attn_output.159"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4322" name="Constant_58116" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4323" name="__module.model.model.decoder.layers.19.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2622"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4324" name="self.model.model.decoder.layers.19.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="228881888" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4325" name="Convert_1637949" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4326" name="self.model.model.decoder.layers.19.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="229406176" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4327" name="Convert_1637952" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4328" name="self.model.model.decoder.layers.19.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4329" name="self.model.model.decoder.layers.19.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="229410272" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4330" name="self.model.model.decoder.layers.19.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4331" name="Constant_1637957" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4332" name="Reshape_1637958" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4333" name="self.model.model.decoder.layers.19.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4334" name="__module.model.model.decoder.layers.19.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4335" name="Constant_54790" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="229426656" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4336" name="__module.model.model.decoder.layers.19.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2625,input.157"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4337" name="__module.model.model.decoder.layers.19/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2627,residual.119"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4338" name="__module.model.model.decoder.layers.19.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4339" name="__module.model.model.decoder.layers.19.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4340" name="Constant_54791" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="229430752" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4341" name="__module.model.model.decoder.layers.19.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4342" name="Constant_54792" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="229434848" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4343" name="__module.model.model.decoder.layers.19.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2631"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4344" name="self.model.model.decoder.layers.19.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="229438944" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4345" name="Convert_877026" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4346" name="self.model.model.decoder.layers.19.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="231536096" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4347" name="Convert_877029" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4348" name="self.model.model.decoder.layers.19.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4349" name="self.model.model.decoder.layers.19.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="231552480" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4350" name="self.model.model.decoder.layers.19.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4351" name="Constant_877034" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4352" name="Reshape_877035" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4353" name="self.model.model.decoder.layers.19.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4354" name="__module.model.model.decoder.layers.19.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4355" name="Constant_54793" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="231618016" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4356" name="__module.model.model.decoder.layers.19.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="2634"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4357" name="__module.model.model.decoder.layers.19.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="2635,input.159"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4358" name="self.model.model.decoder.layers.19.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="231634400" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4359" name="Convert_881325" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4360" name="self.model.model.decoder.layers.19.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="233731552" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4361" name="Convert_881328" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4362" name="self.model.model.decoder.layers.19.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4363" name="self.model.model.decoder.layers.19.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="233747936" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4364" name="self.model.model.decoder.layers.19.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4365" name="Constant_881333" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4366" name="Reshape_881334" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4367" name="self.model.model.decoder.layers.19.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4368" name="__module.model.model.decoder.layers.19.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4369" name="Constant_54794" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="233813472" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4370" name="__module.model.model.decoder.layers.19.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2639,input.161"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4371" name="__module.model.model.decoder.layers.19/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2641,2643,residual.121"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4372" name="__module.model.model.decoder.layers.20.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4373" name="__module.model.model.decoder.layers.20.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4374" name="Constant_54795" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="233817568" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4375" name="__module.model.model.decoder.layers.20.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4376" name="Constant_54796" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="233821664" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4377" name="__module.model.model.decoder.layers.20.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2656,hidden_states.201"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4378" name="self.model.model.decoder.layers.20.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="233825760" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4379" name="Convert_1650846" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4380" name="self.model.model.decoder.layers.20.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="234350048" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4381" name="Convert_1650849" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4382" name="self.model.model.decoder.layers.20.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4383" name="self.model.model.decoder.layers.20.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="234354144" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4384" name="self.model.model.decoder.layers.20.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4385" name="Constant_1650854" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4386" name="Reshape_1650855" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4387" name="self.model.model.decoder.layers.20.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4388" name="__module.model.model.decoder.layers.20.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4389" name="Constant_54797" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="234370528" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4390" name="__module.model.model.decoder.layers.20.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2665,tensor.241"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4391" name="Constant_58117" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4392" name="__module.model.model.decoder.layers.20.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2667"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4393" name="__module.model.model.decoder.layers.20.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4394" name="__module.model.model.decoder.layers.20.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2668"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4395" name="Constant_60937" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4396" name="Constant_60930" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4397" name="Constant_60932" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4398" name="Constant_60934" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4399" name="Concat_60935" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4400" name="Broadcast_60938" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4401" name="ReadValue_59993" type="ReadValue" version="opset6"> <data variable_id="past_key_values.20.decoder.keypresent.20.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.20.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4402" name="Constant_59536" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4403" name="Gather_59537" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4404" name="self.model.model.decoder.layers.20.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="234374624" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4405" name="Convert_1646547" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4406" name="self.model.model.decoder.layers.20.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="234898912" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4407" name="Convert_1646550" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4408" name="self.model.model.decoder.layers.20.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4409" name="self.model.model.decoder.layers.20.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="234903008" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4410" name="self.model.model.decoder.layers.20.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4411" name="Constant_1646555" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4412" name="Reshape_1646556" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4413" name="self.model.model.decoder.layers.20.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4414" name="__module.model.model.decoder.layers.20.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2671,tensor.243"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4415" name="Constant_58118" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4416" name="__module.model.model.decoder.layers.20.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2673"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4417" name="__module.model.model.decoder.layers.20.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4418" name="__module.model.model.decoder.layers.20.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2674"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4419" name="__module.model.model.decoder.layers.20.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.49"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4420" name="Constant_60925" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4421" name="Constant_60918" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4422" name="Constant_60920" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4423" name="Constant_60922" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4424" name="Concat_60923" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4425" name="Broadcast_60926" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4426" name="ReadValue_59995" type="ReadValue" version="opset6"> <data variable_id="past_key_values.20.decoder.valuepresent.20.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.20.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4427" name="Constant_59539" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4428" name="Gather_59540" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4429" name="self.model.model.decoder.layers.20.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="234919392" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4430" name="Convert_1642248" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4431" name="self.model.model.decoder.layers.20.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="235443680" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4432" name="Convert_1642251" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4433" name="self.model.model.decoder.layers.20.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4434" name="self.model.model.decoder.layers.20.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="235447776" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4435" name="self.model.model.decoder.layers.20.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4436" name="Constant_1642256" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4437" name="Reshape_1642257" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4438" name="self.model.model.decoder.layers.20.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4439" name="__module.model.model.decoder.layers.20.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4440" name="Constant_54798" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="235464160" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4441" name="__module.model.model.decoder.layers.20.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2678,tensor.245"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4442" name="Constant_58119" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4443" name="__module.model.model.decoder.layers.20.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2680"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4444" name="__module.model.model.decoder.layers.20.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4445" name="__module.model.model.decoder.layers.20.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2681"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4446" name="__module.model.model.decoder.layers.20.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4447" name="__module.model.model.decoder.layers.20.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2692,attn_output.161"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4448" name="__module.model.model.decoder.layers.20.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4449" name="__module.model.model.decoder.layers.20.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2693,attn_output.163"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4450" name="Constant_58120" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4451" name="__module.model.model.decoder.layers.20.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2695"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4452" name="self.model.model.decoder.layers.20.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="235468256" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4453" name="Convert_1655145" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4454" name="self.model.model.decoder.layers.20.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="235992544" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4455" name="Convert_1655148" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4456" name="self.model.model.decoder.layers.20.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4457" name="self.model.model.decoder.layers.20.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="235996640" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4458" name="self.model.model.decoder.layers.20.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4459" name="Constant_1655153" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4460" name="Reshape_1655154" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4461" name="self.model.model.decoder.layers.20.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4462" name="__module.model.model.decoder.layers.20.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4463" name="Constant_54799" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="236013024" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4464" name="__module.model.model.decoder.layers.20.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2698,2700,input.163"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4465" name="__module.model.model.decoder.layers.20/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2704,residual.123"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4466" name="__module.model.model.decoder.layers.20.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4467" name="__module.model.model.decoder.layers.20.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4468" name="Constant_54800" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="236017120" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4469" name="__module.model.model.decoder.layers.20.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4470" name="Constant_54801" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="236021216" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4471" name="__module.model.model.decoder.layers.20.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2708,hidden_states.205"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4472" name="self.model.model.decoder.layers.20.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="236025312" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4473" name="Convert_1659444" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4474" name="self.model.model.decoder.layers.20.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="236549600" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4475" name="Convert_1659447" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4476" name="self.model.model.decoder.layers.20.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4477" name="self.model.model.decoder.layers.20.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="236553696" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4478" name="self.model.model.decoder.layers.20.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4479" name="Constant_1659452" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4480" name="Reshape_1659453" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4481" name="self.model.model.decoder.layers.20.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4482" name="__module.model.model.decoder.layers.20.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4483" name="Constant_54802" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="236570080" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4484" name="__module.model.model.decoder.layers.20.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2717,tensor.247"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4485" name="Constant_58121" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4486" name="__module.model.model.decoder.layers.20.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2719"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4487" name="__module.model.model.decoder.layers.20.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4488" name="__module.model.model.decoder.layers.20.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2720"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4489" name="__module.model.model.decoder.layers.20.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="2735,attn_output.165"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4490" name="__module.model.model.decoder.layers.20.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4491" name="__module.model.model.decoder.layers.20.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2736,attn_output.167"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4492" name="Constant_58124" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4493" name="__module.model.model.decoder.layers.20.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2738"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4494" name="self.model.model.decoder.layers.20.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="236574176" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4495" name="Convert_1663743" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4496" name="self.model.model.decoder.layers.20.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="237098464" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4497" name="Convert_1663746" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4498" name="self.model.model.decoder.layers.20.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4499" name="self.model.model.decoder.layers.20.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="237102560" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4500" name="self.model.model.decoder.layers.20.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4501" name="Constant_1663751" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4502" name="Reshape_1663752" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4503" name="self.model.model.decoder.layers.20.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4504" name="__module.model.model.decoder.layers.20.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4505" name="Constant_54804" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="237118944" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4506" name="__module.model.model.decoder.layers.20.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2741,input.165"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4507" name="__module.model.model.decoder.layers.20/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2743,residual.125"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4508" name="__module.model.model.decoder.layers.20.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4509" name="__module.model.model.decoder.layers.20.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4510" name="Constant_54805" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="237123040" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4511" name="__module.model.model.decoder.layers.20.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4512" name="Constant_54806" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="237127136" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4513" name="__module.model.model.decoder.layers.20.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2747"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4514" name="self.model.model.decoder.layers.20.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="237131232" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4515" name="Convert_885624" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4516" name="self.model.model.decoder.layers.20.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="239228384" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4517" name="Convert_885627" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4518" name="self.model.model.decoder.layers.20.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4519" name="self.model.model.decoder.layers.20.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="239244768" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4520" name="self.model.model.decoder.layers.20.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4521" name="Constant_885632" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4522" name="Reshape_885633" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4523" name="self.model.model.decoder.layers.20.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4524" name="__module.model.model.decoder.layers.20.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4525" name="Constant_54807" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="239310304" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4526" name="__module.model.model.decoder.layers.20.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="2750"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4527" name="__module.model.model.decoder.layers.20.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="2751,input.167"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4528" name="self.model.model.decoder.layers.20.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="239326688" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4529" name="Convert_889923" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4530" name="self.model.model.decoder.layers.20.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="241423840" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4531" name="Convert_889926" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4532" name="self.model.model.decoder.layers.20.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4533" name="self.model.model.decoder.layers.20.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="241440224" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4534" name="self.model.model.decoder.layers.20.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4535" name="Constant_889931" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4536" name="Reshape_889932" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4537" name="self.model.model.decoder.layers.20.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4538" name="__module.model.model.decoder.layers.20.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4539" name="Constant_54808" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="241505760" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4540" name="__module.model.model.decoder.layers.20.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2755,input.169"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4541" name="__module.model.model.decoder.layers.20/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2757,2759,residual.127"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4542" name="__module.model.model.decoder.layers.21.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4543" name="__module.model.model.decoder.layers.21.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4544" name="Constant_54809" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="241509856" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4545" name="__module.model.model.decoder.layers.21.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4546" name="Constant_54810" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="241513952" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4547" name="__module.model.model.decoder.layers.21.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2772,hidden_states.211"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4548" name="self.model.model.decoder.layers.21.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="241518048" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4549" name="Convert_1676640" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4550" name="self.model.model.decoder.layers.21.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="242042336" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4551" name="Convert_1676643" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4552" name="self.model.model.decoder.layers.21.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4553" name="self.model.model.decoder.layers.21.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="242046432" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4554" name="self.model.model.decoder.layers.21.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4555" name="Constant_1676648" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4556" name="Reshape_1676649" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4557" name="self.model.model.decoder.layers.21.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4558" name="__module.model.model.decoder.layers.21.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4559" name="Constant_54811" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="242062816" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4560" name="__module.model.model.decoder.layers.21.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2781,tensor.253"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4561" name="Constant_58125" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4562" name="__module.model.model.decoder.layers.21.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2783"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4563" name="__module.model.model.decoder.layers.21.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4564" name="__module.model.model.decoder.layers.21.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2784"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4565" name="Constant_60961" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4566" name="Constant_60954" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4567" name="Constant_60956" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4568" name="Constant_60958" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4569" name="Concat_60959" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4570" name="Broadcast_60962" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4571" name="ReadValue_59997" type="ReadValue" version="opset6"> <data variable_id="past_key_values.21.decoder.keypresent.21.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.21.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4572" name="Constant_59542" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4573" name="Gather_59543" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4574" name="self.model.model.decoder.layers.21.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="242066912" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4575" name="Convert_1672341" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4576" name="self.model.model.decoder.layers.21.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="242591200" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4577" name="Convert_1672344" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4578" name="self.model.model.decoder.layers.21.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4579" name="self.model.model.decoder.layers.21.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="242595296" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4580" name="self.model.model.decoder.layers.21.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4581" name="Constant_1672349" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4582" name="Reshape_1672350" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4583" name="self.model.model.decoder.layers.21.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4584" name="__module.model.model.decoder.layers.21.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2787,tensor.255"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4585" name="Constant_58126" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4586" name="__module.model.model.decoder.layers.21.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2789"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4587" name="__module.model.model.decoder.layers.21.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4588" name="__module.model.model.decoder.layers.21.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2790"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4589" name="__module.model.model.decoder.layers.21.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.51"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4590" name="Constant_60949" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4591" name="Constant_60942" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4592" name="Constant_60944" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4593" name="Constant_60946" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4594" name="Concat_60947" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4595" name="Broadcast_60950" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4596" name="ReadValue_59999" type="ReadValue" version="opset6"> <data variable_id="past_key_values.21.decoder.valuepresent.21.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.21.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4597" name="Constant_59545" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4598" name="Gather_59546" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4599" name="self.model.model.decoder.layers.21.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="242611680" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4600" name="Convert_1668042" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4601" name="self.model.model.decoder.layers.21.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="243135968" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4602" name="Convert_1668045" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4603" name="self.model.model.decoder.layers.21.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4604" name="self.model.model.decoder.layers.21.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="243140064" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4605" name="self.model.model.decoder.layers.21.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4606" name="Constant_1668050" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4607" name="Reshape_1668051" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4608" name="self.model.model.decoder.layers.21.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4609" name="__module.model.model.decoder.layers.21.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4610" name="Constant_54812" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="243156448" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4611" name="__module.model.model.decoder.layers.21.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2794,tensor.257"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4612" name="Constant_58127" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4613" name="__module.model.model.decoder.layers.21.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2796"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4614" name="__module.model.model.decoder.layers.21.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4615" name="__module.model.model.decoder.layers.21.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2797"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4616" name="__module.model.model.decoder.layers.21.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4617" name="__module.model.model.decoder.layers.21.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2808,attn_output.169"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4618" name="__module.model.model.decoder.layers.21.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4619" name="__module.model.model.decoder.layers.21.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2809,attn_output.171"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4620" name="Constant_58128" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4621" name="__module.model.model.decoder.layers.21.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2811"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4622" name="self.model.model.decoder.layers.21.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="243160544" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4623" name="Convert_1680939" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4624" name="self.model.model.decoder.layers.21.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="243684832" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4625" name="Convert_1680942" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4626" name="self.model.model.decoder.layers.21.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4627" name="self.model.model.decoder.layers.21.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="243688928" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4628" name="self.model.model.decoder.layers.21.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4629" name="Constant_1680947" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4630" name="Reshape_1680948" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4631" name="self.model.model.decoder.layers.21.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4632" name="__module.model.model.decoder.layers.21.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4633" name="Constant_54813" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="243705312" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4634" name="__module.model.model.decoder.layers.21.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2814,2816,input.171"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4635" name="__module.model.model.decoder.layers.21/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2820,residual.129"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4636" name="__module.model.model.decoder.layers.21.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4637" name="__module.model.model.decoder.layers.21.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4638" name="Constant_54814" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="243709408" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4639" name="__module.model.model.decoder.layers.21.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4640" name="Constant_54815" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="243713504" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4641" name="__module.model.model.decoder.layers.21.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2824,hidden_states.215"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4642" name="self.model.model.decoder.layers.21.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="243717600" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4643" name="Convert_1685238" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4644" name="self.model.model.decoder.layers.21.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="244241888" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4645" name="Convert_1685241" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4646" name="self.model.model.decoder.layers.21.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4647" name="self.model.model.decoder.layers.21.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="244245984" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4648" name="self.model.model.decoder.layers.21.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4649" name="Constant_1685246" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4650" name="Reshape_1685247" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4651" name="self.model.model.decoder.layers.21.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4652" name="__module.model.model.decoder.layers.21.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4653" name="Constant_54816" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="244262368" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4654" name="__module.model.model.decoder.layers.21.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2833,tensor.259"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4655" name="Constant_58129" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4656" name="__module.model.model.decoder.layers.21.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2835"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4657" name="__module.model.model.decoder.layers.21.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4658" name="__module.model.model.decoder.layers.21.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2836"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4659" name="__module.model.model.decoder.layers.21.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="2851,attn_output.173"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4660" name="__module.model.model.decoder.layers.21.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4661" name="__module.model.model.decoder.layers.21.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2852,attn_output.175"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4662" name="Constant_58132" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4663" name="__module.model.model.decoder.layers.21.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2854"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4664" name="self.model.model.decoder.layers.21.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="244266464" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4665" name="Convert_1689537" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4666" name="self.model.model.decoder.layers.21.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="244790752" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4667" name="Convert_1689540" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4668" name="self.model.model.decoder.layers.21.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4669" name="self.model.model.decoder.layers.21.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="244794848" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4670" name="self.model.model.decoder.layers.21.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4671" name="Constant_1689545" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4672" name="Reshape_1689546" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4673" name="self.model.model.decoder.layers.21.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4674" name="__module.model.model.decoder.layers.21.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4675" name="Constant_54818" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="244811232" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4676" name="__module.model.model.decoder.layers.21.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2857,input.173"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4677" name="__module.model.model.decoder.layers.21/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2859,residual.131"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4678" name="__module.model.model.decoder.layers.21.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4679" name="__module.model.model.decoder.layers.21.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4680" name="Constant_54819" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="244815328" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4681" name="__module.model.model.decoder.layers.21.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4682" name="Constant_54820" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="244819424" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4683" name="__module.model.model.decoder.layers.21.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2863"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4684" name="self.model.model.decoder.layers.21.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="244823520" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4685" name="Convert_894222" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4686" name="self.model.model.decoder.layers.21.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="246920672" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4687" name="Convert_894225" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4688" name="self.model.model.decoder.layers.21.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4689" name="self.model.model.decoder.layers.21.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="246937056" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4690" name="self.model.model.decoder.layers.21.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4691" name="Constant_894230" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4692" name="Reshape_894231" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4693" name="self.model.model.decoder.layers.21.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4694" name="__module.model.model.decoder.layers.21.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4695" name="Constant_54821" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="247002592" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4696" name="__module.model.model.decoder.layers.21.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="2866"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4697" name="__module.model.model.decoder.layers.21.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="2867,input.175"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4698" name="self.model.model.decoder.layers.21.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="247018976" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4699" name="Convert_898521" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4700" name="self.model.model.decoder.layers.21.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="249116128" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4701" name="Convert_898524" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4702" name="self.model.model.decoder.layers.21.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4703" name="self.model.model.decoder.layers.21.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="249132512" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4704" name="self.model.model.decoder.layers.21.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4705" name="Constant_898529" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4706" name="Reshape_898530" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4707" name="self.model.model.decoder.layers.21.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4708" name="__module.model.model.decoder.layers.21.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4709" name="Constant_54822" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="249198048" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4710" name="__module.model.model.decoder.layers.21.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2871,input.177"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4711" name="__module.model.model.decoder.layers.21/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2873,2875,residual.133"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4712" name="__module.model.model.decoder.layers.22.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4713" name="__module.model.model.decoder.layers.22.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4714" name="Constant_54823" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="249202144" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4715" name="__module.model.model.decoder.layers.22.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4716" name="Constant_54824" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="249206240" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4717" name="__module.model.model.decoder.layers.22.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2888,hidden_states.221"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4718" name="self.model.model.decoder.layers.22.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="249210336" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4719" name="Convert_1702434" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4720" name="self.model.model.decoder.layers.22.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="249734624" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4721" name="Convert_1702437" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4722" name="self.model.model.decoder.layers.22.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4723" name="self.model.model.decoder.layers.22.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="249738720" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4724" name="self.model.model.decoder.layers.22.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4725" name="Constant_1702442" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4726" name="Reshape_1702443" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4727" name="self.model.model.decoder.layers.22.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4728" name="__module.model.model.decoder.layers.22.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4729" name="Constant_54825" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="249755104" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4730" name="__module.model.model.decoder.layers.22.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2897,tensor.265"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4731" name="Constant_58133" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4732" name="__module.model.model.decoder.layers.22.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2899"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4733" name="__module.model.model.decoder.layers.22.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4734" name="__module.model.model.decoder.layers.22.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2900"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4735" name="Constant_60985" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4736" name="Constant_60978" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4737" name="Constant_60980" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4738" name="Constant_60982" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4739" name="Concat_60983" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4740" name="Broadcast_60986" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4741" name="ReadValue_60001" type="ReadValue" version="opset6"> <data variable_id="past_key_values.22.decoder.keypresent.22.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.22.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4742" name="Constant_59548" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4743" name="Gather_59549" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4744" name="self.model.model.decoder.layers.22.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="249759200" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4745" name="Convert_1698135" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4746" name="self.model.model.decoder.layers.22.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="250283488" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4747" name="Convert_1698138" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4748" name="self.model.model.decoder.layers.22.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4749" name="self.model.model.decoder.layers.22.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="250287584" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4750" name="self.model.model.decoder.layers.22.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4751" name="Constant_1698143" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4752" name="Reshape_1698144" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4753" name="self.model.model.decoder.layers.22.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4754" name="__module.model.model.decoder.layers.22.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2903,tensor.267"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4755" name="Constant_58134" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4756" name="__module.model.model.decoder.layers.22.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2905"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4757" name="__module.model.model.decoder.layers.22.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4758" name="__module.model.model.decoder.layers.22.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2906"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4759" name="__module.model.model.decoder.layers.22.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states.53"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4760" name="Constant_60973" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4761" name="Constant_60966" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4762" name="Constant_60968" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4763" name="Constant_60970" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4764" name="Concat_60971" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4765" name="Broadcast_60974" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4766" name="ReadValue_60003" type="ReadValue" version="opset6"> <data variable_id="past_key_values.22.decoder.valuepresent.22.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.22.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4767" name="Constant_59551" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4768" name="Gather_59552" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4769" name="self.model.model.decoder.layers.22.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="250303968" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4770" name="Convert_1693836" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4771" name="self.model.model.decoder.layers.22.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="250828256" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4772" name="Convert_1693839" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4773" name="self.model.model.decoder.layers.22.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4774" name="self.model.model.decoder.layers.22.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="250832352" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4775" name="self.model.model.decoder.layers.22.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4776" name="Constant_1693844" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4777" name="Reshape_1693845" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4778" name="self.model.model.decoder.layers.22.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4779" name="__module.model.model.decoder.layers.22.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4780" name="Constant_54826" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="250848736" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4781" name="__module.model.model.decoder.layers.22.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2910,tensor.269"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4782" name="Constant_58135" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4783" name="__module.model.model.decoder.layers.22.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2912"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4784" name="__module.model.model.decoder.layers.22.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4785" name="__module.model.model.decoder.layers.22.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2913"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4786" name="__module.model.model.decoder.layers.22.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4787" name="__module.model.model.decoder.layers.22.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2924,attn_output.177"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4788" name="__module.model.model.decoder.layers.22.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4789" name="__module.model.model.decoder.layers.22.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2925,attn_output.179"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4790" name="Constant_58136" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4791" name="__module.model.model.decoder.layers.22.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2927"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4792" name="self.model.model.decoder.layers.22.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="250852832" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4793" name="Convert_1706733" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4794" name="self.model.model.decoder.layers.22.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="251377120" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4795" name="Convert_1706736" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4796" name="self.model.model.decoder.layers.22.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4797" name="self.model.model.decoder.layers.22.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="251381216" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4798" name="self.model.model.decoder.layers.22.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4799" name="Constant_1706741" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4800" name="Reshape_1706742" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4801" name="self.model.model.decoder.layers.22.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4802" name="__module.model.model.decoder.layers.22.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4803" name="Constant_54827" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="251397600" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4804" name="__module.model.model.decoder.layers.22.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2930,2932,input.179"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4805" name="__module.model.model.decoder.layers.22/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2936,residual.135"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4806" name="__module.model.model.decoder.layers.22.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4807" name="__module.model.model.decoder.layers.22.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4808" name="Constant_54828" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="251401696" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4809" name="__module.model.model.decoder.layers.22.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4810" name="Constant_54829" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="251405792" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4811" name="__module.model.model.decoder.layers.22.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2940,hidden_states.225"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4812" name="self.model.model.decoder.layers.22.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="251409888" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4813" name="Convert_1711032" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4814" name="self.model.model.decoder.layers.22.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="251934176" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4815" name="Convert_1711035" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4816" name="self.model.model.decoder.layers.22.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4817" name="self.model.model.decoder.layers.22.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="251938272" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4818" name="self.model.model.decoder.layers.22.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4819" name="Constant_1711040" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4820" name="Reshape_1711041" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4821" name="self.model.model.decoder.layers.22.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4822" name="__module.model.model.decoder.layers.22.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4823" name="Constant_54830" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="251954656" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4824" name="__module.model.model.decoder.layers.22.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2949,tensor.271"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4825" name="Constant_58137" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4826" name="__module.model.model.decoder.layers.22.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2951"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4827" name="__module.model.model.decoder.layers.22.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4828" name="__module.model.model.decoder.layers.22.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2952"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4829" name="__module.model.model.decoder.layers.22.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="2967,attn_output.181"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4830" name="__module.model.model.decoder.layers.22.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4831" name="__module.model.model.decoder.layers.22.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2968,attn_output.183"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4832" name="Constant_58140" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4833" name="__module.model.model.decoder.layers.22.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2970"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4834" name="self.model.model.decoder.layers.22.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="251958752" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4835" name="Convert_1715331" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4836" name="self.model.model.decoder.layers.22.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="252483040" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4837" name="Convert_1715334" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4838" name="self.model.model.decoder.layers.22.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4839" name="self.model.model.decoder.layers.22.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="252487136" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4840" name="self.model.model.decoder.layers.22.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4841" name="Constant_1715339" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4842" name="Reshape_1715340" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4843" name="self.model.model.decoder.layers.22.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4844" name="__module.model.model.decoder.layers.22.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4845" name="Constant_54832" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="252503520" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4846" name="__module.model.model.decoder.layers.22.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2973,input.181"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4847" name="__module.model.model.decoder.layers.22/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2975,residual.137"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4848" name="__module.model.model.decoder.layers.22.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4849" name="__module.model.model.decoder.layers.22.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4850" name="Constant_54833" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="252507616" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4851" name="__module.model.model.decoder.layers.22.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4852" name="Constant_54834" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="252511712" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4853" name="__module.model.model.decoder.layers.22.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2979"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4854" name="self.model.model.decoder.layers.22.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="252515808" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4855" name="Convert_902820" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4856" name="self.model.model.decoder.layers.22.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="254612960" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4857" name="Convert_902823" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4858" name="self.model.model.decoder.layers.22.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4859" name="self.model.model.decoder.layers.22.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="254629344" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4860" name="self.model.model.decoder.layers.22.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4861" name="Constant_902828" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4862" name="Reshape_902829" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4863" name="self.model.model.decoder.layers.22.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4864" name="__module.model.model.decoder.layers.22.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4865" name="Constant_54835" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="254694880" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4866" name="__module.model.model.decoder.layers.22.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="2982"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4867" name="__module.model.model.decoder.layers.22.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="2983,input.183"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4868" name="self.model.model.decoder.layers.22.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="254711264" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4869" name="Convert_907119" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4870" name="self.model.model.decoder.layers.22.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="256808416" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4871" name="Convert_907122" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4872" name="self.model.model.decoder.layers.22.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4873" name="self.model.model.decoder.layers.22.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="256824800" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="4874" name="self.model.model.decoder.layers.22.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="4875" name="Constant_907127" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4876" name="Reshape_907128" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4877" name="self.model.model.decoder.layers.22.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="4878" name="__module.model.model.decoder.layers.22.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4879" name="Constant_54836" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="256890336" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4880" name="__module.model.model.decoder.layers.22.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2987,input.185"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4881" name="__module.model.model.decoder.layers.22/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="2989,2991,residual.139"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4882" name="__module.model.model.decoder.layers.23.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="4883" name="__module.model.model.decoder.layers.23.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4884" name="Constant_54837" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="256894432" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4885" name="__module.model.model.decoder.layers.23.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4886" name="Constant_54838" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="256898528" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4887" name="__module.model.model.decoder.layers.23.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3004,hidden_states.231"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4888" name="self.model.model.decoder.layers.23.self_attn.v_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="256902624" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4889" name="Convert_1719630" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4890" name="self.model.model.decoder.layers.23.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="257426912" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4891" name="Convert_1719633" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4892" name="self.model.model.decoder.layers.23.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4893" name="self.model.model.decoder.layers.23.self_attn.v_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="257431008" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4894" name="self.model.model.decoder.layers.23.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4895" name="Constant_1719638" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4896" name="Reshape_1719639" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4897" name="self.model.model.decoder.layers.23.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4898" name="__module.model.model.decoder.layers.23.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4899" name="Constant_54839" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="257447392" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4900" name="__module.model.model.decoder.layers.23.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3026,tensor.281"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4901" name="Constant_58141" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4902" name="__module.model.model.decoder.layers.23.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3028"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4903" name="__module.model.model.decoder.layers.23.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4904" name="__module.model.model.decoder.layers.23.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3029"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4905" name="__module.model.model.decoder.layers.23.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="present.23.decoder.value"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4907" name="Constant_60997" type="Const" version="opset1"> <data element_type="f32" shape="" offset="26247232" size="4" /> <output> <port id="0" precision="FP32" /> </output> </layer> <layer id="4908" name="Constant_60990" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247244" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4909" name="Constant_60992" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247236" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4910" name="Constant_60994" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="26247252" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4911" name="Concat_60995" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4912" name="Broadcast_60998" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </output> </layer> <layer id="4913" name="ReadValue_60005" type="ReadValue" version="opset6"> <data variable_id="past_key_values.23.decoder.keypresent.23.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>0</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.23.decoder.key"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4914" name="Constant_59554" type="Const" version="opset1"> <data element_type="i64" shape="" offset="26247236" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4915" name="Gather_59555" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4916" name="self.model.model.decoder.layers.23.self_attn.k_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="257451488" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4917" name="Convert_1723929" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4918" name="self.model.model.decoder.layers.23.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="257975776" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4919" name="Convert_1723932" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4920" name="self.model.model.decoder.layers.23.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4921" name="self.model.model.decoder.layers.23.self_attn.k_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="257979872" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4922" name="self.model.model.decoder.layers.23.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4923" name="Constant_1723937" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4924" name="Reshape_1723938" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4925" name="self.model.model.decoder.layers.23.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4926" name="__module.model.model.decoder.layers.23.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3019,tensor.279"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4927" name="Constant_58142" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4928" name="__module.model.model.decoder.layers.23.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3021"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4929" name="__module.model.model.decoder.layers.23.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4930" name="__module.model.model.decoder.layers.23.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3022"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4931" name="__module.model.model.decoder.layers.23.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="2" precision="FP32" names="key_states"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4965" name="self.model.model.decoder.layers.23.self_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="257996256" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4966" name="Convert_1728228" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4967" name="self.model.model.decoder.layers.23.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="258520544" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4968" name="Convert_1728231" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4969" name="self.model.model.decoder.layers.23.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4970" name="self.model.model.decoder.layers.23.self_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="258524640" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4971" name="self.model.model.decoder.layers.23.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4972" name="Constant_1728236" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4973" name="Reshape_1728237" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4974" name="self.model.model.decoder.layers.23.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4975" name="__module.model.model.decoder.layers.23.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4976" name="Constant_54840" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="258541024" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4977" name="__module.model.model.decoder.layers.23.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3013,tensor.277"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4978" name="Constant_58143" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4979" name="__module.model.model.decoder.layers.23.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3015"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4980" name="__module.model.model.decoder.layers.23.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4981" name="__module.model.model.decoder.layers.23.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3016"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4982" name="__module.model.model.decoder.layers.23.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3040,attn_output.185"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4983" name="__module.model.model.decoder.layers.23.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4984" name="__module.model.model.decoder.layers.23.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3041,attn_output.187"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="4985" name="Constant_58144" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4986" name="__module.model.model.decoder.layers.23.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3043"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4987" name="self.model.model.decoder.layers.23.self_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="258545120" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4988" name="Convert_1732527" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4989" name="self.model.model.decoder.layers.23.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="259069408" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4990" name="Convert_1732530" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4991" name="self.model.model.decoder.layers.23.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4992" name="self.model.model.decoder.layers.23.self_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="259073504" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="4993" name="self.model.model.decoder.layers.23.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="4994" name="Constant_1732535" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="4995" name="Reshape_1732536" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4996" name="self.model.model.decoder.layers.23.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4997" name="__module.model.model.decoder.layers.23.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4998" name="Constant_54841" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="259089888" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="4999" name="__module.model.model.decoder.layers.23.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3046,3048,input.187"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5000" name="__module.model.model.decoder.layers.23/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3052,residual.141"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5001" name="__module.model.model.decoder.layers.23.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="5002" name="__module.model.model.decoder.layers.23.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5003" name="Constant_54842" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="259093984" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5004" name="__module.model.model.decoder.layers.23.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5005" name="Constant_54843" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="259098080" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5006" name="__module.model.model.decoder.layers.23.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3056,hidden_states.235"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5007" name="self.model.model.decoder.layers.23.encoder_attn.q_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="259102176" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5008" name="Convert_1736826" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5009" name="self.model.model.decoder.layers.23.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="259626464" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="5010" name="Convert_1736829" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="5011" name="self.model.model.decoder.layers.23.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5012" name="self.model.model.decoder.layers.23.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="259630560" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="5013" name="self.model.model.decoder.layers.23.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5014" name="Constant_1736834" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="5015" name="Reshape_1736835" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5016" name="self.model.model.decoder.layers.23.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5017" name="__module.model.model.decoder.layers.23.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5018" name="Constant_54844" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="259646944" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5019" name="__module.model.model.decoder.layers.23.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3065,tensor.283"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5020" name="Constant_58145" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="548880" size="32" /> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="5021" name="__module.model.model.decoder.layers.23.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3067"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="5022" name="__module.model.model.decoder.layers.23.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5023" name="__module.model.model.decoder.layers.23.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3068"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="5024" name="__module.model.model.decoder.layers.23.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="3" precision="FP32" names="3083,attn_output.189"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="5025" name="__module.model.model.decoder.layers.23.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="548912" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="5026" name="__module.model.model.decoder.layers.23.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3084,attn_output"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> </output> </layer> <layer id="5027" name="Constant_58148" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="81622440" size="24" /> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="5028" name="__module.model.model.decoder.layers.23.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16</dim> <dim>64</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3086"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5029" name="self.model.model.decoder.layers.23.encoder_attn.out_proj.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 128" offset="259651040" size="524288" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5030" name="Convert_1741125" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5031" name="self.model.model.decoder.layers.23.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 8, 1" offset="260175328" size="4096" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="5032" name="Convert_1741128" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="5033" name="self.model.model.decoder.layers.23.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5034" name="self.model.model.decoder.layers.23.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 8, 1" offset="260179424" size="16384" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="5035" name="self.model.model.decoder.layers.23.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5036" name="Constant_1741133" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="544768" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="5037" name="Reshape_1741134" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5038" name="self.model.model.decoder.layers.23.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5039" name="__module.model.model.decoder.layers.23.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5040" name="Constant_54846" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="260195808" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5041" name="__module.model.model.decoder.layers.23.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3089,input.189"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5042" name="__module.model.model.decoder.layers.23/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3091,residual"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5043" name="__module.model.model.decoder.layers.23.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="5044" name="__module.model.model.decoder.layers.23.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5045" name="Constant_54847" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="260199904" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5046" name="__module.model.model.decoder.layers.23.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5047" name="Constant_54848" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="260204000" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5048" name="__module.model.model.decoder.layers.23.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3095"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5049" name="self.model.model.decoder.layers.23.fc1.weight" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 128" offset="260208096" size="2097152" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5050" name="Convert_911418" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5051" name="self.model.model.decoder.layers.23.fc1.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="4096, 8, 1" offset="262305248" size="16384" /> <output> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="5052" name="Convert_911421" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="5053" name="self.model.model.decoder.layers.23.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5054" name="self.model.model.decoder.layers.23.fc1.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="4096, 8, 1" offset="262321632" size="65536" /> <output> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </output> </layer> <layer id="5055" name="self.model.model.decoder.layers.23.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> </output> </layer> <layer id="5056" name="Constant_911426" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="85464512" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="5057" name="Reshape_911427" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>8</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5058" name="self.model.model.decoder.layers.23.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5059" name="__module.model.model.decoder.layers.23.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>4096</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="5060" name="Constant_54849" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 4096" offset="262387168" size="16384" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="5061" name="__module.model.model.decoder.layers.23.fc1/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32" names="3098"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="5062" name="__module.model.model.decoder.layers.23.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> <data approximation_mode="ERF" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32" names="3099,input.191"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> </output> </layer> <layer id="5063" name="self.model.model.decoder.layers.23.fc2.weight" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 128" offset="262403552" size="2097152" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="5064" name="Convert_915717" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="5065" name="self.model.model.decoder.layers.23.fc2.weight/zero_point" type="Const" version="opset1"> <data element_type="u4" shape="1024, 32, 1" offset="264500704" size="16384" /> <output> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="5066" name="Convert_915720" type="Convert" version="opset1"> <data destination_type="f16" /> <input> <port id="0" precision="U4"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="5067" name="self.model.model.decoder.layers.23.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="5068" name="self.model.model.decoder.layers.23.fc2.weight/scale" type="Const" version="opset1"> <data element_type="f16" shape="1024, 32, 1" offset="264517088" size="65536" /> <output> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </output> </layer> <layer id="5069" name="self.model.model.decoder.layers.23.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> </output> </layer> <layer id="5070" name="Constant_915725" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="87659984" size="16" /> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="5071" name="Reshape_915726" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>32</dim> <dim>128</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="5072" name="self.model.model.decoder.layers.23.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="FP16"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </output> </layer> <layer id="5073" name="__module.model.model.decoder.layers.23.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>4096</dim> </port> <port id="1" precision="FP32"> <dim>1024</dim> <dim>4096</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5074" name="Constant_54850" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="264582624" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5075" name="__module.model.model.decoder.layers.23.fc2/aten::linear/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3103,input"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5076" name="__module.model.model.decoder.layers.23/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3105,3107"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5077" name="__module.model.model.decoder.layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="79971708" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="5078" name="__module.model.model.decoder.layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> <data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5079" name="Constant_54851" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="264586720" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5080" name="__module.model.model.decoder.layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5081" name="Constant_54852" type="Const" version="opset1"> <data element_type="f32" shape="1, 1, 1024" offset="264590816" size="4096" /> <output> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5082" name="__module.model.model.decoder.layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="3113,3115,3165"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> </output> </layer> <layer id="5083" name="__module.model.proj_out/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1024</dim> </port> <port id="1" precision="FP32"> <dim>51864</dim> <dim>1024</dim> </port> </input> <output> <port id="2" precision="FP32" names="logits"> <dim>-1</dim> <dim>-1</dim> <dim>51864</dim> </port> </output> </layer> <layer id="4964" name="Assign_59942" type="Assign" version="opset6"> <data variable_id="past_key_values.0.decoder.keypresent.0.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4963" name="Assign_59944" type="Assign" version="opset6"> <data variable_id="past_key_values.0.decoder.valuepresent.0.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4962" name="Assign_59946" type="Assign" version="opset6"> <data variable_id="past_key_values.1.decoder.keypresent.1.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4961" name="Assign_59948" type="Assign" version="opset6"> <data variable_id="past_key_values.1.decoder.valuepresent.1.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4960" name="Assign_59950" type="Assign" version="opset6"> <data variable_id="past_key_values.10.decoder.keypresent.10.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4959" name="Assign_59952" type="Assign" version="opset6"> <data variable_id="past_key_values.10.decoder.valuepresent.10.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4958" name="Assign_59954" type="Assign" version="opset6"> <data variable_id="past_key_values.11.decoder.keypresent.11.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4957" name="Assign_59956" type="Assign" version="opset6"> <data variable_id="past_key_values.11.decoder.valuepresent.11.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4956" name="Assign_59958" type="Assign" version="opset6"> <data variable_id="past_key_values.12.decoder.keypresent.12.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4955" name="Assign_59960" type="Assign" version="opset6"> <data variable_id="past_key_values.12.decoder.valuepresent.12.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4954" name="Assign_59962" type="Assign" version="opset6"> <data variable_id="past_key_values.13.decoder.keypresent.13.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4953" name="Assign_59964" type="Assign" version="opset6"> <data variable_id="past_key_values.13.decoder.valuepresent.13.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4952" name="Assign_59966" type="Assign" version="opset6"> <data variable_id="past_key_values.14.decoder.keypresent.14.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4951" name="Assign_59968" type="Assign" version="opset6"> <data variable_id="past_key_values.14.decoder.valuepresent.14.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4950" name="Assign_59970" type="Assign" version="opset6"> <data variable_id="past_key_values.15.decoder.keypresent.15.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4949" name="Assign_59972" type="Assign" version="opset6"> <data variable_id="past_key_values.15.decoder.valuepresent.15.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4948" name="Assign_59974" type="Assign" version="opset6"> <data variable_id="past_key_values.16.decoder.keypresent.16.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4947" name="Assign_59976" type="Assign" version="opset6"> <data variable_id="past_key_values.16.decoder.valuepresent.16.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4946" name="Assign_59978" type="Assign" version="opset6"> <data variable_id="past_key_values.17.decoder.keypresent.17.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4945" name="Assign_59980" type="Assign" version="opset6"> <data variable_id="past_key_values.17.decoder.valuepresent.17.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4944" name="Assign_59982" type="Assign" version="opset6"> <data variable_id="past_key_values.18.decoder.keypresent.18.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4943" name="Assign_59984" type="Assign" version="opset6"> <data variable_id="past_key_values.18.decoder.valuepresent.18.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4942" name="Assign_59986" type="Assign" version="opset6"> <data variable_id="past_key_values.19.decoder.keypresent.19.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4941" name="Assign_59988" type="Assign" version="opset6"> <data variable_id="past_key_values.19.decoder.valuepresent.19.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4940" name="Assign_59990" type="Assign" version="opset6"> <data variable_id="past_key_values.2.decoder.keypresent.2.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4939" name="Assign_59992" type="Assign" version="opset6"> <data variable_id="past_key_values.2.decoder.valuepresent.2.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4938" name="Assign_59994" type="Assign" version="opset6"> <data variable_id="past_key_values.20.decoder.keypresent.20.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4937" name="Assign_59996" type="Assign" version="opset6"> <data variable_id="past_key_values.20.decoder.valuepresent.20.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4936" name="Assign_59998" type="Assign" version="opset6"> <data variable_id="past_key_values.21.decoder.keypresent.21.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4935" name="Assign_60000" type="Assign" version="opset6"> <data variable_id="past_key_values.21.decoder.valuepresent.21.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4934" name="Assign_60002" type="Assign" version="opset6"> <data variable_id="past_key_values.22.decoder.keypresent.22.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4933" name="Assign_60004" type="Assign" version="opset6"> <data variable_id="past_key_values.22.decoder.valuepresent.22.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4932" name="Assign_60006" type="Assign" version="opset6"> <data variable_id="past_key_values.23.decoder.keypresent.23.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="4906" name="Assign_60008" type="Assign" version="opset6"> <data variable_id="past_key_values.23.decoder.valuepresent.23.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2550" name="Assign_60010" type="Assign" version="opset6"> <data variable_id="past_key_values.3.decoder.keypresent.3.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2549" name="Assign_60012" type="Assign" version="opset6"> <data variable_id="past_key_values.3.decoder.valuepresent.3.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2548" name="Assign_60014" type="Assign" version="opset6"> <data variable_id="past_key_values.4.decoder.keypresent.4.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2547" name="Assign_60016" type="Assign" version="opset6"> <data variable_id="past_key_values.4.decoder.valuepresent.4.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2546" name="Assign_60018" type="Assign" version="opset6"> <data variable_id="past_key_values.5.decoder.keypresent.5.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2545" name="Assign_60020" type="Assign" version="opset6"> <data variable_id="past_key_values.5.decoder.valuepresent.5.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2544" name="Assign_60022" type="Assign" version="opset6"> <data variable_id="past_key_values.6.decoder.keypresent.6.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2543" name="Assign_60024" type="Assign" version="opset6"> <data variable_id="past_key_values.6.decoder.valuepresent.6.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2542" name="Assign_60026" type="Assign" version="opset6"> <data variable_id="past_key_values.7.decoder.keypresent.7.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2541" name="Assign_60028" type="Assign" version="opset6"> <data variable_id="past_key_values.7.decoder.valuepresent.7.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2540" name="Assign_60030" type="Assign" version="opset6"> <data variable_id="past_key_values.8.decoder.keypresent.8.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2539" name="Assign_60032" type="Assign" version="opset6"> <data variable_id="past_key_values.8.decoder.valuepresent.8.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2538" name="Assign_60034" type="Assign" version="opset6"> <data variable_id="past_key_values.9.decoder.keypresent.9.decoder.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="2512" name="Assign_60036" type="Assign" version="opset6"> <data variable_id="past_key_values.9.decoder.valuepresent.9.decoder.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="867" name="Assign_61480" type="Assign" version="opset6"> <data variable_id="2494" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="850" name="Assign_61482" type="Assign" version="opset6"> <data variable_id="2385" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="831" name="Assign_61484" type="Assign" version="opset6"> <data variable_id="522" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="814" name="Assign_61486" type="Assign" version="opset6"> <data variable_id="1450" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="797" name="Assign_61488" type="Assign" version="opset6"> <data variable_id="2501" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="778" name="Assign_61490" type="Assign" version="opset6"> <data variable_id="2610" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="761" name="Assign_61492" type="Assign" version="opset6"> <data variable_id="638" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="744" name="Assign_61494" type="Assign" version="opset6"> <data variable_id="529" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="725" name="Assign_61496" type="Assign" version="opset6"> <data variable_id="1457" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="706" name="Assign_61498" type="Assign" version="opset6"> <data variable_id="1566" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="689" name="Assign_61500" type="Assign" version="opset6"> <data variable_id="2726" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="672" name="Assign_61502" type="Assign" version="opset6"> <data variable_id="2617" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="653" name="Assign_61504" type="Assign" version="opset6"> <data variable_id="1573" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="634" name="Assign_61506" type="Assign" version="opset6"> <data variable_id="2733" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="615" name="Assign_61508" type="Assign" version="opset6"> <data variable_id="2842" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="598" name="Assign_61510" type="Assign" version="opset6"> <data variable_id="754" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="581" name="Assign_61512" type="Assign" version="opset6"> <data variable_id="645" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="562" name="Assign_61514" type="Assign" version="opset6"> <data variable_id="1682" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="545" name="Assign_61516" type="Assign" version="opset6"> <data variable_id="2958" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="528" name="Assign_61518" type="Assign" version="opset6"> <data variable_id="870" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="511" name="Assign_61520" type="Assign" version="opset6"> <data variable_id="2849" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="492" name="Assign_61522" type="Assign" version="opset6"> <data variable_id="761" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="473" name="Assign_61524" type="Assign" version="opset6"> <data variable_id="1689" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="454" name="Assign_61526" type="Assign" version="opset6"> <data variable_id="2965" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="435" name="Assign_61528" type="Assign" version="opset6"> <data variable_id="877" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="416" name="Assign_61530" type="Assign" version="opset6"> <data variable_id="1798" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="399" name="Assign_61532" type="Assign" version="opset6"> <data variable_id="986" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="382" name="Assign_61534" type="Assign" version="opset6"> <data variable_id="1805" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="363" name="Assign_61536" type="Assign" version="opset6"> <data variable_id="993" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="344" name="Assign_61538" type="Assign" version="opset6"> <data variable_id="406" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="327" name="Assign_61540" type="Assign" version="opset6"> <data variable_id="1914" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="310" name="Assign_61542" type="Assign" version="opset6"> <data variable_id="1102" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="293" name="Assign_61544" type="Assign" version="opset6"> <data variable_id="3074" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="276" name="Assign_61546" type="Assign" version="opset6"> <data variable_id="413" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="257" name="Assign_61548" type="Assign" version="opset6"> <data variable_id="1921" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="238" name="Assign_61550" type="Assign" version="opset6"> <data variable_id="1109" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="219" name="Assign_61552" type="Assign" version="opset6"> <data variable_id="2030" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="202" name="Assign_61554" type="Assign" version="opset6"> <data variable_id="3081" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="183" name="Assign_61556" type="Assign" version="opset6"> <data variable_id="1218" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="166" name="Assign_61558" type="Assign" version="opset6"> <data variable_id="2146" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="149" name="Assign_61560" type="Assign" version="opset6"> <data variable_id="2037" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="130" name="Assign_61562" type="Assign" version="opset6"> <data variable_id="1334" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="113" name="Assign_61564" type="Assign" version="opset6"> <data variable_id="1225" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="94" name="Assign_61566" type="Assign" version="opset6"> <data variable_id="2153" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="75" name="Assign_61568" type="Assign" version="opset6"> <data variable_id="2262" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="58" name="Assign_61570" type="Assign" version="opset6"> <data variable_id="1341" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="39" name="Assign_61572" type="Assign" version="opset6"> <data variable_id="2378" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="22" name="Assign_61574" type="Assign" version="opset6"> <data variable_id="2269" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>16</dim> <dim>-1</dim> <dim>64</dim> </port> </output> </layer> <layer id="5084" name="Result_33032" type="Result" version="opset1" output_names="logits"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>51864</dim> </port> </input> </layer> </layers> <edges> <edge from-layer="0" from-port="0" to-layer="2521" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2898" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3043" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3068" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="971" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3213" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2204" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3238" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3383" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3408" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2349" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2374" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3553" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3578" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3723" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3748" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="880" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3893" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3918" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4063" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4088" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4233" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4258" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4403" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4428" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4573" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4598" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="946" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4743" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4768" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2559" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4915" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2873" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1159" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1184" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1329" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1354" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1499" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1524" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1669" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1694" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1839" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2728" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2703" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2179" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2034" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2009" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1864" to-port="1" /> <edge from-layer="1" from-port="0" to-layer="903" to-port="0" /> <edge from-layer="1" from-port="0" to-layer="1006" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="105" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="160" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="141" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="177" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="194" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="213" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="230" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="249" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="268" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="287" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="304" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="321" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="338" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="86" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="355" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="124" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="573" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="717" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="700" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="683" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="664" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="645" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="626" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="609" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="592" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="736" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="14" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="556" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="539" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="522" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="503" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="484" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="465" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="446" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="33" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="374" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="69" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="393" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="50" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="410" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="861" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="842" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="825" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="808" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="789" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="772" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="427" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="755" to-port="0" /> <edge from-layer="3" from-port="0" to-layer="869" to-port="0" /> <edge from-layer="3" from-port="0" to-layer="890" to-port="0" /> <edge from-layer="3" from-port="0" to-layer="904" to-port="0" /> <edge from-layer="4" from-port="0" to-layer="5" to-port="0" /> <edge from-layer="5" from-port="1" to-layer="8" to-port="0" /> <edge from-layer="6" from-port="0" to-layer="7" to-port="0" /> <edge from-layer="7" from-port="1" to-layer="8" to-port="1" /> <edge from-layer="8" from-port="2" to-layer="10" to-port="0" /> <edge from-layer="9" from-port="0" to-layer="10" to-port="1" /> <edge from-layer="10" from-port="2" to-layer="12" to-port="0" /> <edge from-layer="11" from-port="0" to-layer="12" to-port="1" /> <edge from-layer="12" from-port="2" to-layer="13" to-port="0" /> <edge from-layer="13" from-port="1" to-layer="14" to-port="1" /> <edge from-layer="14" from-port="2" to-layer="16" to-port="0" /> <edge from-layer="15" from-port="0" to-layer="16" to-port="1" /> <edge from-layer="16" from-port="2" to-layer="18" to-port="0" /> <edge from-layer="17" from-port="0" to-layer="18" to-port="1" /> <edge from-layer="18" from-port="2" to-layer="20" to-port="0" /> <edge from-layer="19" from-port="0" to-layer="20" to-port="1" /> <edge from-layer="20" from-port="2" to-layer="21" to-port="0" /> <edge from-layer="21" from-port="1" to-layer="22" to-port="0" /> <edge from-layer="21" from-port="1" to-layer="3809" to-port="2" /> <edge from-layer="23" from-port="0" to-layer="24" to-port="0" /> <edge from-layer="24" from-port="1" to-layer="27" to-port="0" /> <edge from-layer="25" from-port="0" to-layer="26" to-port="0" /> <edge from-layer="26" from-port="1" to-layer="27" to-port="1" /> <edge from-layer="27" from-port="2" to-layer="29" to-port="0" /> <edge from-layer="28" from-port="0" to-layer="29" to-port="1" /> <edge from-layer="29" from-port="2" to-layer="31" to-port="0" /> <edge from-layer="30" from-port="0" to-layer="31" to-port="1" /> <edge from-layer="31" from-port="2" to-layer="32" to-port="0" /> <edge from-layer="32" from-port="1" to-layer="33" to-port="1" /> <edge from-layer="33" from-port="2" to-layer="35" to-port="0" /> <edge from-layer="34" from-port="0" to-layer="35" to-port="1" /> <edge from-layer="35" from-port="2" to-layer="37" to-port="0" /> <edge from-layer="36" from-port="0" to-layer="37" to-port="1" /> <edge from-layer="37" from-port="2" to-layer="38" to-port="0" /> <edge from-layer="38" from-port="1" to-layer="39" to-port="0" /> <edge from-layer="38" from-port="1" to-layer="3979" to-port="1" /> <edge from-layer="40" from-port="0" to-layer="41" to-port="0" /> <edge from-layer="41" from-port="1" to-layer="44" to-port="0" /> <edge from-layer="42" from-port="0" to-layer="43" to-port="0" /> <edge from-layer="43" from-port="1" to-layer="44" to-port="1" /> <edge from-layer="44" from-port="2" to-layer="46" to-port="0" /> <edge from-layer="45" from-port="0" to-layer="46" to-port="1" /> <edge from-layer="46" from-port="2" to-layer="48" to-port="0" /> <edge from-layer="47" from-port="0" to-layer="48" to-port="1" /> <edge from-layer="48" from-port="2" to-layer="49" to-port="0" /> <edge from-layer="49" from-port="1" to-layer="50" to-port="1" /> <edge from-layer="50" from-port="2" to-layer="52" to-port="0" /> <edge from-layer="51" from-port="0" to-layer="52" to-port="1" /> <edge from-layer="52" from-port="2" to-layer="54" to-port="0" /> <edge from-layer="53" from-port="0" to-layer="54" to-port="1" /> <edge from-layer="54" from-port="2" to-layer="56" to-port="0" /> <edge from-layer="55" from-port="0" to-layer="56" to-port="1" /> <edge from-layer="56" from-port="2" to-layer="57" to-port="0" /> <edge from-layer="57" from-port="1" to-layer="2435" to-port="2" /> <edge from-layer="57" from-port="1" to-layer="58" to-port="0" /> <edge from-layer="59" from-port="0" to-layer="60" to-port="0" /> <edge from-layer="60" from-port="1" to-layer="63" to-port="0" /> <edge from-layer="61" from-port="0" to-layer="62" to-port="0" /> <edge from-layer="62" from-port="1" to-layer="63" to-port="1" /> <edge from-layer="63" from-port="2" to-layer="65" to-port="0" /> <edge from-layer="64" from-port="0" to-layer="65" to-port="1" /> <edge from-layer="65" from-port="2" to-layer="67" to-port="0" /> <edge from-layer="66" from-port="0" to-layer="67" to-port="1" /> <edge from-layer="67" from-port="2" to-layer="68" to-port="0" /> <edge from-layer="68" from-port="1" to-layer="69" to-port="1" /> <edge from-layer="69" from-port="2" to-layer="71" to-port="0" /> <edge from-layer="70" from-port="0" to-layer="71" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="73" to-port="0" /> <edge from-layer="72" from-port="0" to-layer="73" to-port="1" /> <edge from-layer="73" from-port="2" to-layer="74" to-port="0" /> <edge from-layer="74" from-port="1" to-layer="3809" to-port="1" /> <edge from-layer="74" from-port="1" to-layer="75" to-port="0" /> <edge from-layer="76" from-port="0" to-layer="77" to-port="0" /> <edge from-layer="77" from-port="1" to-layer="80" to-port="0" /> <edge from-layer="78" from-port="0" to-layer="79" to-port="0" /> <edge from-layer="79" from-port="1" to-layer="80" to-port="1" /> <edge from-layer="80" from-port="2" to-layer="82" to-port="0" /> <edge from-layer="81" from-port="0" to-layer="82" to-port="1" /> <edge from-layer="82" from-port="2" to-layer="84" to-port="0" /> <edge from-layer="83" from-port="0" to-layer="84" to-port="1" /> <edge from-layer="84" from-port="2" to-layer="85" to-port="0" /> <edge from-layer="85" from-port="1" to-layer="86" to-port="1" /> <edge from-layer="86" from-port="2" to-layer="88" to-port="0" /> <edge from-layer="87" from-port="0" to-layer="88" to-port="1" /> <edge from-layer="88" from-port="2" to-layer="90" to-port="0" /> <edge from-layer="89" from-port="0" to-layer="90" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="92" to-port="0" /> <edge from-layer="91" from-port="0" to-layer="92" to-port="1" /> <edge from-layer="92" from-port="2" to-layer="93" to-port="0" /> <edge from-layer="93" from-port="1" to-layer="3639" to-port="2" /> <edge from-layer="93" from-port="1" to-layer="94" to-port="0" /> <edge from-layer="95" from-port="0" to-layer="96" to-port="0" /> <edge from-layer="96" from-port="1" to-layer="99" to-port="0" /> <edge from-layer="97" from-port="0" to-layer="98" to-port="0" /> <edge from-layer="98" from-port="1" to-layer="99" to-port="1" /> <edge from-layer="99" from-port="2" to-layer="101" to-port="0" /> <edge from-layer="100" from-port="0" to-layer="101" to-port="1" /> <edge from-layer="101" from-port="2" to-layer="103" to-port="0" /> <edge from-layer="102" from-port="0" to-layer="103" to-port="1" /> <edge from-layer="103" from-port="2" to-layer="104" to-port="0" /> <edge from-layer="104" from-port="1" to-layer="105" to-port="1" /> <edge from-layer="105" from-port="2" to-layer="107" to-port="0" /> <edge from-layer="106" from-port="0" to-layer="107" to-port="1" /> <edge from-layer="107" from-port="2" to-layer="109" to-port="0" /> <edge from-layer="108" from-port="0" to-layer="109" to-port="1" /> <edge from-layer="109" from-port="2" to-layer="111" to-port="0" /> <edge from-layer="110" from-port="0" to-layer="111" to-port="1" /> <edge from-layer="111" from-port="2" to-layer="112" to-port="0" /> <edge from-layer="112" from-port="1" to-layer="2265" to-port="2" /> <edge from-layer="112" from-port="1" to-layer="113" to-port="0" /> <edge from-layer="114" from-port="0" to-layer="115" to-port="0" /> <edge from-layer="115" from-port="1" to-layer="118" to-port="0" /> <edge from-layer="116" from-port="0" to-layer="117" to-port="0" /> <edge from-layer="117" from-port="1" to-layer="118" to-port="1" /> <edge from-layer="118" from-port="2" to-layer="120" to-port="0" /> <edge from-layer="119" from-port="0" to-layer="120" to-port="1" /> <edge from-layer="120" from-port="2" to-layer="122" to-port="0" /> <edge from-layer="121" from-port="0" to-layer="122" to-port="1" /> <edge from-layer="122" from-port="2" to-layer="123" to-port="0" /> <edge from-layer="123" from-port="1" to-layer="124" to-port="1" /> <edge from-layer="124" from-port="2" to-layer="126" to-port="0" /> <edge from-layer="125" from-port="0" to-layer="126" to-port="1" /> <edge from-layer="126" from-port="2" to-layer="128" to-port="0" /> <edge from-layer="127" from-port="0" to-layer="128" to-port="1" /> <edge from-layer="128" from-port="2" to-layer="129" to-port="0" /> <edge from-layer="129" from-port="1" to-layer="2435" to-port="1" /> <edge from-layer="129" from-port="1" to-layer="130" to-port="0" /> <edge from-layer="131" from-port="0" to-layer="132" to-port="0" /> <edge from-layer="132" from-port="1" to-layer="135" to-port="0" /> <edge from-layer="133" from-port="0" to-layer="134" to-port="0" /> <edge from-layer="134" from-port="1" to-layer="135" to-port="1" /> <edge from-layer="135" from-port="2" to-layer="137" to-port="0" /> <edge from-layer="136" from-port="0" to-layer="137" to-port="1" /> <edge from-layer="137" from-port="2" to-layer="139" to-port="0" /> <edge from-layer="138" from-port="0" to-layer="139" to-port="1" /> <edge from-layer="139" from-port="2" to-layer="140" to-port="0" /> <edge from-layer="140" from-port="1" to-layer="141" to-port="1" /> <edge from-layer="141" from-port="2" to-layer="143" to-port="0" /> <edge from-layer="142" from-port="0" to-layer="143" to-port="1" /> <edge from-layer="143" from-port="2" to-layer="145" to-port="0" /> <edge from-layer="144" from-port="0" to-layer="145" to-port="1" /> <edge from-layer="145" from-port="2" to-layer="147" to-port="0" /> <edge from-layer="146" from-port="0" to-layer="147" to-port="1" /> <edge from-layer="147" from-port="2" to-layer="148" to-port="0" /> <edge from-layer="148" from-port="1" to-layer="149" to-port="0" /> <edge from-layer="148" from-port="1" to-layer="3469" to-port="2" /> <edge from-layer="150" from-port="0" to-layer="151" to-port="0" /> <edge from-layer="151" from-port="1" to-layer="154" to-port="0" /> <edge from-layer="152" from-port="0" to-layer="153" to-port="0" /> <edge from-layer="153" from-port="1" to-layer="154" to-port="1" /> <edge from-layer="154" from-port="2" to-layer="156" to-port="0" /> <edge from-layer="155" from-port="0" to-layer="156" to-port="1" /> <edge from-layer="156" from-port="2" to-layer="158" to-port="0" /> <edge from-layer="157" from-port="0" to-layer="158" to-port="1" /> <edge from-layer="158" from-port="2" to-layer="159" to-port="0" /> <edge from-layer="159" from-port="1" to-layer="160" to-port="1" /> <edge from-layer="160" from-port="2" to-layer="162" to-port="0" /> <edge from-layer="161" from-port="0" to-layer="162" to-port="1" /> <edge from-layer="162" from-port="2" to-layer="164" to-port="0" /> <edge from-layer="163" from-port="0" to-layer="164" to-port="1" /> <edge from-layer="164" from-port="2" to-layer="165" to-port="0" /> <edge from-layer="165" from-port="1" to-layer="166" to-port="0" /> <edge from-layer="165" from-port="1" to-layer="3639" to-port="1" /> <edge from-layer="167" from-port="0" to-layer="168" to-port="0" /> <edge from-layer="168" from-port="1" to-layer="171" to-port="0" /> <edge from-layer="169" from-port="0" to-layer="170" to-port="0" /> <edge from-layer="170" from-port="1" to-layer="171" to-port="1" /> <edge from-layer="171" from-port="2" to-layer="173" to-port="0" /> <edge from-layer="172" from-port="0" to-layer="173" to-port="1" /> <edge from-layer="173" from-port="2" to-layer="175" to-port="0" /> <edge from-layer="174" from-port="0" to-layer="175" to-port="1" /> <edge from-layer="175" from-port="2" to-layer="176" to-port="0" /> <edge from-layer="176" from-port="1" to-layer="177" to-port="1" /> <edge from-layer="177" from-port="2" to-layer="179" to-port="0" /> <edge from-layer="178" from-port="0" to-layer="179" to-port="1" /> <edge from-layer="179" from-port="2" to-layer="181" to-port="0" /> <edge from-layer="180" from-port="0" to-layer="181" to-port="1" /> <edge from-layer="181" from-port="2" to-layer="182" to-port="0" /> <edge from-layer="182" from-port="1" to-layer="2265" to-port="1" /> <edge from-layer="182" from-port="1" to-layer="183" to-port="0" /> <edge from-layer="184" from-port="0" to-layer="185" to-port="0" /> <edge from-layer="185" from-port="1" to-layer="188" to-port="0" /> <edge from-layer="186" from-port="0" to-layer="187" to-port="0" /> <edge from-layer="187" from-port="1" to-layer="188" to-port="1" /> <edge from-layer="188" from-port="2" to-layer="190" to-port="0" /> <edge from-layer="189" from-port="0" to-layer="190" to-port="1" /> <edge from-layer="190" from-port="2" to-layer="192" to-port="0" /> <edge from-layer="191" from-port="0" to-layer="192" to-port="1" /> <edge from-layer="192" from-port="2" to-layer="193" to-port="0" /> <edge from-layer="193" from-port="1" to-layer="194" to-port="1" /> <edge from-layer="194" from-port="2" to-layer="196" to-port="0" /> <edge from-layer="195" from-port="0" to-layer="196" to-port="1" /> <edge from-layer="196" from-port="2" to-layer="198" to-port="0" /> <edge from-layer="197" from-port="0" to-layer="198" to-port="1" /> <edge from-layer="198" from-port="2" to-layer="200" to-port="0" /> <edge from-layer="199" from-port="0" to-layer="200" to-port="1" /> <edge from-layer="200" from-port="2" to-layer="201" to-port="0" /> <edge from-layer="201" from-port="1" to-layer="202" to-port="0" /> <edge from-layer="201" from-port="1" to-layer="5024" to-port="2" /> <edge from-layer="203" from-port="0" to-layer="204" to-port="0" /> <edge from-layer="204" from-port="1" to-layer="207" to-port="0" /> <edge from-layer="205" from-port="0" to-layer="206" to-port="0" /> <edge from-layer="206" from-port="1" to-layer="207" to-port="1" /> <edge from-layer="207" from-port="2" to-layer="209" to-port="0" /> <edge from-layer="208" from-port="0" to-layer="209" to-port="1" /> <edge from-layer="209" from-port="2" to-layer="211" to-port="0" /> <edge from-layer="210" from-port="0" to-layer="211" to-port="1" /> <edge from-layer="211" from-port="2" to-layer="212" to-port="0" /> <edge from-layer="212" from-port="1" to-layer="213" to-port="1" /> <edge from-layer="213" from-port="2" to-layer="215" to-port="0" /> <edge from-layer="214" from-port="0" to-layer="215" to-port="1" /> <edge from-layer="215" from-port="2" to-layer="217" to-port="0" /> <edge from-layer="216" from-port="0" to-layer="217" to-port="1" /> <edge from-layer="217" from-port="2" to-layer="218" to-port="0" /> <edge from-layer="218" from-port="1" to-layer="3469" to-port="1" /> <edge from-layer="218" from-port="1" to-layer="219" to-port="0" /> <edge from-layer="220" from-port="0" to-layer="221" to-port="0" /> <edge from-layer="221" from-port="1" to-layer="224" to-port="0" /> <edge from-layer="222" from-port="0" to-layer="223" to-port="0" /> <edge from-layer="223" from-port="1" to-layer="224" to-port="1" /> <edge from-layer="224" from-port="2" to-layer="226" to-port="0" /> <edge from-layer="225" from-port="0" to-layer="226" to-port="1" /> <edge from-layer="226" from-port="2" to-layer="228" to-port="0" /> <edge from-layer="227" from-port="0" to-layer="228" to-port="1" /> <edge from-layer="228" from-port="2" to-layer="229" to-port="0" /> <edge from-layer="229" from-port="1" to-layer="230" to-port="1" /> <edge from-layer="230" from-port="2" to-layer="232" to-port="0" /> <edge from-layer="231" from-port="0" to-layer="232" to-port="1" /> <edge from-layer="232" from-port="2" to-layer="234" to-port="0" /> <edge from-layer="233" from-port="0" to-layer="234" to-port="1" /> <edge from-layer="234" from-port="2" to-layer="236" to-port="0" /> <edge from-layer="235" from-port="0" to-layer="236" to-port="1" /> <edge from-layer="236" from-port="2" to-layer="237" to-port="0" /> <edge from-layer="237" from-port="1" to-layer="2095" to-port="2" /> <edge from-layer="237" from-port="1" to-layer="238" to-port="0" /> <edge from-layer="239" from-port="0" to-layer="240" to-port="0" /> <edge from-layer="240" from-port="1" to-layer="243" to-port="0" /> <edge from-layer="241" from-port="0" to-layer="242" to-port="0" /> <edge from-layer="242" from-port="1" to-layer="243" to-port="1" /> <edge from-layer="243" from-port="2" to-layer="245" to-port="0" /> <edge from-layer="244" from-port="0" to-layer="245" to-port="1" /> <edge from-layer="245" from-port="2" to-layer="247" to-port="0" /> <edge from-layer="246" from-port="0" to-layer="247" to-port="1" /> <edge from-layer="247" from-port="2" to-layer="248" to-port="0" /> <edge from-layer="248" from-port="1" to-layer="249" to-port="1" /> <edge from-layer="249" from-port="2" to-layer="251" to-port="0" /> <edge from-layer="250" from-port="0" to-layer="251" to-port="1" /> <edge from-layer="251" from-port="2" to-layer="253" to-port="0" /> <edge from-layer="252" from-port="0" to-layer="253" to-port="1" /> <edge from-layer="253" from-port="2" to-layer="255" to-port="0" /> <edge from-layer="254" from-port="0" to-layer="255" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="256" to-port="0" /> <edge from-layer="256" from-port="1" to-layer="3299" to-port="2" /> <edge from-layer="256" from-port="1" to-layer="257" to-port="0" /> <edge from-layer="258" from-port="0" to-layer="259" to-port="0" /> <edge from-layer="259" from-port="1" to-layer="262" to-port="0" /> <edge from-layer="260" from-port="0" to-layer="261" to-port="0" /> <edge from-layer="261" from-port="1" to-layer="262" to-port="1" /> <edge from-layer="262" from-port="2" to-layer="264" to-port="0" /> <edge from-layer="263" from-port="0" to-layer="264" to-port="1" /> <edge from-layer="264" from-port="2" to-layer="266" to-port="0" /> <edge from-layer="265" from-port="0" to-layer="266" to-port="1" /> <edge from-layer="266" from-port="2" to-layer="267" to-port="0" /> <edge from-layer="267" from-port="1" to-layer="268" to-port="1" /> <edge from-layer="268" from-port="2" to-layer="270" to-port="0" /> <edge from-layer="269" from-port="0" to-layer="270" to-port="1" /> <edge from-layer="270" from-port="2" to-layer="272" to-port="0" /> <edge from-layer="271" from-port="0" to-layer="272" to-port="1" /> <edge from-layer="272" from-port="2" to-layer="274" to-port="0" /> <edge from-layer="273" from-port="0" to-layer="274" to-port="1" /> <edge from-layer="274" from-port="2" to-layer="275" to-port="0" /> <edge from-layer="275" from-port="1" to-layer="276" to-port="0" /> <edge from-layer="275" from-port="1" to-layer="1075" to-port="2" /> <edge from-layer="277" from-port="0" to-layer="278" to-port="0" /> <edge from-layer="278" from-port="1" to-layer="281" to-port="0" /> <edge from-layer="279" from-port="0" to-layer="280" to-port="0" /> <edge from-layer="280" from-port="1" to-layer="281" to-port="1" /> <edge from-layer="281" from-port="2" to-layer="283" to-port="0" /> <edge from-layer="282" from-port="0" to-layer="283" to-port="1" /> <edge from-layer="283" from-port="2" to-layer="285" to-port="0" /> <edge from-layer="284" from-port="0" to-layer="285" to-port="1" /> <edge from-layer="285" from-port="2" to-layer="286" to-port="0" /> <edge from-layer="286" from-port="1" to-layer="287" to-port="1" /> <edge from-layer="287" from-port="2" to-layer="289" to-port="0" /> <edge from-layer="288" from-port="0" to-layer="289" to-port="1" /> <edge from-layer="289" from-port="2" to-layer="291" to-port="0" /> <edge from-layer="290" from-port="0" to-layer="291" to-port="1" /> <edge from-layer="291" from-port="2" to-layer="292" to-port="0" /> <edge from-layer="292" from-port="1" to-layer="293" to-port="0" /> <edge from-layer="292" from-port="1" to-layer="5024" to-port="1" /> <edge from-layer="294" from-port="0" to-layer="295" to-port="0" /> <edge from-layer="295" from-port="1" to-layer="298" to-port="0" /> <edge from-layer="296" from-port="0" to-layer="297" to-port="0" /> <edge from-layer="297" from-port="1" to-layer="298" to-port="1" /> <edge from-layer="298" from-port="2" to-layer="300" to-port="0" /> <edge from-layer="299" from-port="0" to-layer="300" to-port="1" /> <edge from-layer="300" from-port="2" to-layer="302" to-port="0" /> <edge from-layer="301" from-port="0" to-layer="302" to-port="1" /> <edge from-layer="302" from-port="2" to-layer="303" to-port="0" /> <edge from-layer="303" from-port="1" to-layer="304" to-port="1" /> <edge from-layer="304" from-port="2" to-layer="306" to-port="0" /> <edge from-layer="305" from-port="0" to-layer="306" to-port="1" /> <edge from-layer="306" from-port="2" to-layer="308" to-port="0" /> <edge from-layer="307" from-port="0" to-layer="308" to-port="1" /> <edge from-layer="308" from-port="2" to-layer="309" to-port="0" /> <edge from-layer="309" from-port="1" to-layer="310" to-port="0" /> <edge from-layer="309" from-port="1" to-layer="2095" to-port="1" /> <edge from-layer="311" from-port="0" to-layer="312" to-port="0" /> <edge from-layer="312" from-port="1" to-layer="315" to-port="0" /> <edge from-layer="313" from-port="0" to-layer="314" to-port="0" /> <edge from-layer="314" from-port="1" to-layer="315" to-port="1" /> <edge from-layer="315" from-port="2" to-layer="317" to-port="0" /> <edge from-layer="316" from-port="0" to-layer="317" to-port="1" /> <edge from-layer="317" from-port="2" to-layer="319" to-port="0" /> <edge from-layer="318" from-port="0" to-layer="319" to-port="1" /> <edge from-layer="319" from-port="2" to-layer="320" to-port="0" /> <edge from-layer="320" from-port="1" to-layer="321" to-port="1" /> <edge from-layer="321" from-port="2" to-layer="323" to-port="0" /> <edge from-layer="322" from-port="0" to-layer="323" to-port="1" /> <edge from-layer="323" from-port="2" to-layer="325" to-port="0" /> <edge from-layer="324" from-port="0" to-layer="325" to-port="1" /> <edge from-layer="325" from-port="2" to-layer="326" to-port="0" /> <edge from-layer="326" from-port="1" to-layer="3299" to-port="1" /> <edge from-layer="326" from-port="1" to-layer="327" to-port="0" /> <edge from-layer="328" from-port="0" to-layer="329" to-port="0" /> <edge from-layer="329" from-port="1" to-layer="332" to-port="0" /> <edge from-layer="330" from-port="0" to-layer="331" to-port="0" /> <edge from-layer="331" from-port="1" to-layer="332" to-port="1" /> <edge from-layer="332" from-port="2" to-layer="334" to-port="0" /> <edge from-layer="333" from-port="0" to-layer="334" to-port="1" /> <edge from-layer="334" from-port="2" to-layer="336" to-port="0" /> <edge from-layer="335" from-port="0" to-layer="336" to-port="1" /> <edge from-layer="336" from-port="2" to-layer="337" to-port="0" /> <edge from-layer="337" from-port="1" to-layer="338" to-port="1" /> <edge from-layer="338" from-port="2" to-layer="340" to-port="0" /> <edge from-layer="339" from-port="0" to-layer="340" to-port="1" /> <edge from-layer="340" from-port="2" to-layer="342" to-port="0" /> <edge from-layer="341" from-port="0" to-layer="342" to-port="1" /> <edge from-layer="342" from-port="2" to-layer="343" to-port="0" /> <edge from-layer="343" from-port="1" to-layer="1075" to-port="1" /> <edge from-layer="343" from-port="1" to-layer="344" to-port="0" /> <edge from-layer="345" from-port="0" to-layer="346" to-port="0" /> <edge from-layer="346" from-port="1" to-layer="349" to-port="0" /> <edge from-layer="347" from-port="0" to-layer="348" to-port="0" /> <edge from-layer="348" from-port="1" to-layer="349" to-port="1" /> <edge from-layer="349" from-port="2" to-layer="351" to-port="0" /> <edge from-layer="350" from-port="0" to-layer="351" to-port="1" /> <edge from-layer="351" from-port="2" to-layer="353" to-port="0" /> <edge from-layer="352" from-port="0" to-layer="353" to-port="1" /> <edge from-layer="353" from-port="2" to-layer="354" to-port="0" /> <edge from-layer="354" from-port="1" to-layer="355" to-port="1" /> <edge from-layer="355" from-port="2" to-layer="357" to-port="0" /> <edge from-layer="356" from-port="0" to-layer="357" to-port="1" /> <edge from-layer="357" from-port="2" to-layer="359" to-port="0" /> <edge from-layer="358" from-port="0" to-layer="359" to-port="1" /> <edge from-layer="359" from-port="2" to-layer="361" to-port="0" /> <edge from-layer="360" from-port="0" to-layer="361" to-port="1" /> <edge from-layer="361" from-port="2" to-layer="362" to-port="0" /> <edge from-layer="362" from-port="1" to-layer="1925" to-port="2" /> <edge from-layer="362" from-port="1" to-layer="363" to-port="0" /> <edge from-layer="364" from-port="0" to-layer="365" to-port="0" /> <edge from-layer="365" from-port="1" to-layer="368" to-port="0" /> <edge from-layer="366" from-port="0" to-layer="367" to-port="0" /> <edge from-layer="367" from-port="1" to-layer="368" to-port="1" /> <edge from-layer="368" from-port="2" to-layer="370" to-port="0" /> <edge from-layer="369" from-port="0" to-layer="370" to-port="1" /> <edge from-layer="370" from-port="2" to-layer="372" to-port="0" /> <edge from-layer="371" from-port="0" to-layer="372" to-port="1" /> <edge from-layer="372" from-port="2" to-layer="373" to-port="0" /> <edge from-layer="373" from-port="1" to-layer="374" to-port="1" /> <edge from-layer="374" from-port="2" to-layer="376" to-port="0" /> <edge from-layer="375" from-port="0" to-layer="376" to-port="1" /> <edge from-layer="376" from-port="2" to-layer="378" to-port="0" /> <edge from-layer="377" from-port="0" to-layer="378" to-port="1" /> <edge from-layer="378" from-port="2" to-layer="380" to-port="0" /> <edge from-layer="379" from-port="0" to-layer="380" to-port="1" /> <edge from-layer="380" from-port="2" to-layer="381" to-port="0" /> <edge from-layer="381" from-port="1" to-layer="3129" to-port="2" /> <edge from-layer="381" from-port="1" to-layer="382" to-port="0" /> <edge from-layer="383" from-port="0" to-layer="384" to-port="0" /> <edge from-layer="384" from-port="1" to-layer="387" to-port="0" /> <edge from-layer="385" from-port="0" to-layer="386" to-port="0" /> <edge from-layer="386" from-port="1" to-layer="387" to-port="1" /> <edge from-layer="387" from-port="2" to-layer="389" to-port="0" /> <edge from-layer="388" from-port="0" to-layer="389" to-port="1" /> <edge from-layer="389" from-port="2" to-layer="391" to-port="0" /> <edge from-layer="390" from-port="0" to-layer="391" to-port="1" /> <edge from-layer="391" from-port="2" to-layer="392" to-port="0" /> <edge from-layer="392" from-port="1" to-layer="393" to-port="1" /> <edge from-layer="393" from-port="2" to-layer="395" to-port="0" /> <edge from-layer="394" from-port="0" to-layer="395" to-port="1" /> <edge from-layer="395" from-port="2" to-layer="397" to-port="0" /> <edge from-layer="396" from-port="0" to-layer="397" to-port="1" /> <edge from-layer="397" from-port="2" to-layer="398" to-port="0" /> <edge from-layer="398" from-port="1" to-layer="1925" to-port="1" /> <edge from-layer="398" from-port="1" to-layer="399" to-port="0" /> <edge from-layer="400" from-port="0" to-layer="401" to-port="0" /> <edge from-layer="401" from-port="1" to-layer="404" to-port="0" /> <edge from-layer="402" from-port="0" to-layer="403" to-port="0" /> <edge from-layer="403" from-port="1" to-layer="404" to-port="1" /> <edge from-layer="404" from-port="2" to-layer="406" to-port="0" /> <edge from-layer="405" from-port="0" to-layer="406" to-port="1" /> <edge from-layer="406" from-port="2" to-layer="408" to-port="0" /> <edge from-layer="407" from-port="0" to-layer="408" to-port="1" /> <edge from-layer="408" from-port="2" to-layer="409" to-port="0" /> <edge from-layer="409" from-port="1" to-layer="410" to-port="1" /> <edge from-layer="410" from-port="2" to-layer="412" to-port="0" /> <edge from-layer="411" from-port="0" to-layer="412" to-port="1" /> <edge from-layer="412" from-port="2" to-layer="414" to-port="0" /> <edge from-layer="413" from-port="0" to-layer="414" to-port="1" /> <edge from-layer="414" from-port="2" to-layer="415" to-port="0" /> <edge from-layer="415" from-port="1" to-layer="416" to-port="0" /> <edge from-layer="415" from-port="1" to-layer="3129" to-port="1" /> <edge from-layer="417" from-port="0" to-layer="418" to-port="0" /> <edge from-layer="418" from-port="1" to-layer="421" to-port="0" /> <edge from-layer="419" from-port="0" to-layer="420" to-port="0" /> <edge from-layer="420" from-port="1" to-layer="421" to-port="1" /> <edge from-layer="421" from-port="2" to-layer="423" to-port="0" /> <edge from-layer="422" from-port="0" to-layer="423" to-port="1" /> <edge from-layer="423" from-port="2" to-layer="425" to-port="0" /> <edge from-layer="424" from-port="0" to-layer="425" to-port="1" /> <edge from-layer="425" from-port="2" to-layer="426" to-port="0" /> <edge from-layer="426" from-port="1" to-layer="427" to-port="1" /> <edge from-layer="427" from-port="2" to-layer="429" to-port="0" /> <edge from-layer="428" from-port="0" to-layer="429" to-port="1" /> <edge from-layer="429" from-port="2" to-layer="431" to-port="0" /> <edge from-layer="430" from-port="0" to-layer="431" to-port="1" /> <edge from-layer="431" from-port="2" to-layer="433" to-port="0" /> <edge from-layer="432" from-port="0" to-layer="433" to-port="1" /> <edge from-layer="433" from-port="2" to-layer="434" to-port="0" /> <edge from-layer="434" from-port="1" to-layer="1755" to-port="2" /> <edge from-layer="434" from-port="1" to-layer="435" to-port="0" /> <edge from-layer="436" from-port="0" to-layer="437" to-port="0" /> <edge from-layer="437" from-port="1" to-layer="440" to-port="0" /> <edge from-layer="438" from-port="0" to-layer="439" to-port="0" /> <edge from-layer="439" from-port="1" to-layer="440" to-port="1" /> <edge from-layer="440" from-port="2" to-layer="442" to-port="0" /> <edge from-layer="441" from-port="0" to-layer="442" to-port="1" /> <edge from-layer="442" from-port="2" to-layer="444" to-port="0" /> <edge from-layer="443" from-port="0" to-layer="444" to-port="1" /> <edge from-layer="444" from-port="2" to-layer="445" to-port="0" /> <edge from-layer="445" from-port="1" to-layer="446" to-port="1" /> <edge from-layer="446" from-port="2" to-layer="448" to-port="0" /> <edge from-layer="447" from-port="0" to-layer="448" to-port="1" /> <edge from-layer="448" from-port="2" to-layer="450" to-port="0" /> <edge from-layer="449" from-port="0" to-layer="450" to-port="1" /> <edge from-layer="450" from-port="2" to-layer="452" to-port="0" /> <edge from-layer="451" from-port="0" to-layer="452" to-port="1" /> <edge from-layer="452" from-port="2" to-layer="453" to-port="0" /> <edge from-layer="453" from-port="1" to-layer="454" to-port="0" /> <edge from-layer="453" from-port="1" to-layer="4829" to-port="2" /> <edge from-layer="455" from-port="0" to-layer="456" to-port="0" /> <edge from-layer="456" from-port="1" to-layer="459" to-port="0" /> <edge from-layer="457" from-port="0" to-layer="458" to-port="0" /> <edge from-layer="458" from-port="1" to-layer="459" to-port="1" /> <edge from-layer="459" from-port="2" to-layer="461" to-port="0" /> <edge from-layer="460" from-port="0" to-layer="461" to-port="1" /> <edge from-layer="461" from-port="2" to-layer="463" to-port="0" /> <edge from-layer="462" from-port="0" to-layer="463" to-port="1" /> <edge from-layer="463" from-port="2" to-layer="464" to-port="0" /> <edge from-layer="464" from-port="1" to-layer="465" to-port="1" /> <edge from-layer="465" from-port="2" to-layer="467" to-port="0" /> <edge from-layer="466" from-port="0" to-layer="467" to-port="1" /> <edge from-layer="467" from-port="2" to-layer="469" to-port="0" /> <edge from-layer="468" from-port="0" to-layer="469" to-port="1" /> <edge from-layer="469" from-port="2" to-layer="471" to-port="0" /> <edge from-layer="470" from-port="0" to-layer="471" to-port="1" /> <edge from-layer="471" from-port="2" to-layer="472" to-port="0" /> <edge from-layer="472" from-port="1" to-layer="2959" to-port="2" /> <edge from-layer="472" from-port="1" to-layer="473" to-port="0" /> <edge from-layer="474" from-port="0" to-layer="475" to-port="0" /> <edge from-layer="475" from-port="1" to-layer="478" to-port="0" /> <edge from-layer="476" from-port="0" to-layer="477" to-port="0" /> <edge from-layer="477" from-port="1" to-layer="478" to-port="1" /> <edge from-layer="478" from-port="2" to-layer="480" to-port="0" /> <edge from-layer="479" from-port="0" to-layer="480" to-port="1" /> <edge from-layer="480" from-port="2" to-layer="482" to-port="0" /> <edge from-layer="481" from-port="0" to-layer="482" to-port="1" /> <edge from-layer="482" from-port="2" to-layer="483" to-port="0" /> <edge from-layer="483" from-port="1" to-layer="484" to-port="1" /> <edge from-layer="484" from-port="2" to-layer="486" to-port="0" /> <edge from-layer="485" from-port="0" to-layer="486" to-port="1" /> <edge from-layer="486" from-port="2" to-layer="488" to-port="0" /> <edge from-layer="487" from-port="0" to-layer="488" to-port="1" /> <edge from-layer="488" from-port="2" to-layer="490" to-port="0" /> <edge from-layer="489" from-port="0" to-layer="490" to-port="1" /> <edge from-layer="490" from-port="2" to-layer="491" to-port="0" /> <edge from-layer="491" from-port="1" to-layer="1585" to-port="2" /> <edge from-layer="491" from-port="1" to-layer="492" to-port="0" /> <edge from-layer="493" from-port="0" to-layer="494" to-port="0" /> <edge from-layer="494" from-port="1" to-layer="497" to-port="0" /> <edge from-layer="495" from-port="0" to-layer="496" to-port="0" /> <edge from-layer="496" from-port="1" to-layer="497" to-port="1" /> <edge from-layer="497" from-port="2" to-layer="499" to-port="0" /> <edge from-layer="498" from-port="0" to-layer="499" to-port="1" /> <edge from-layer="499" from-port="2" to-layer="501" to-port="0" /> <edge from-layer="500" from-port="0" to-layer="501" to-port="1" /> <edge from-layer="501" from-port="2" to-layer="502" to-port="0" /> <edge from-layer="502" from-port="1" to-layer="503" to-port="1" /> <edge from-layer="503" from-port="2" to-layer="505" to-port="0" /> <edge from-layer="504" from-port="0" to-layer="505" to-port="1" /> <edge from-layer="505" from-port="2" to-layer="507" to-port="0" /> <edge from-layer="506" from-port="0" to-layer="507" to-port="1" /> <edge from-layer="507" from-port="2" to-layer="509" to-port="0" /> <edge from-layer="508" from-port="0" to-layer="509" to-port="1" /> <edge from-layer="509" from-port="2" to-layer="510" to-port="0" /> <edge from-layer="510" from-port="1" to-layer="511" to-port="0" /> <edge from-layer="510" from-port="1" to-layer="4659" to-port="2" /> <edge from-layer="512" from-port="0" to-layer="513" to-port="0" /> <edge from-layer="513" from-port="1" to-layer="516" to-port="0" /> <edge from-layer="514" from-port="0" to-layer="515" to-port="0" /> <edge from-layer="515" from-port="1" to-layer="516" to-port="1" /> <edge from-layer="516" from-port="2" to-layer="518" to-port="0" /> <edge from-layer="517" from-port="0" to-layer="518" to-port="1" /> <edge from-layer="518" from-port="2" to-layer="520" to-port="0" /> <edge from-layer="519" from-port="0" to-layer="520" to-port="1" /> <edge from-layer="520" from-port="2" to-layer="521" to-port="0" /> <edge from-layer="521" from-port="1" to-layer="522" to-port="1" /> <edge from-layer="522" from-port="2" to-layer="524" to-port="0" /> <edge from-layer="523" from-port="0" to-layer="524" to-port="1" /> <edge from-layer="524" from-port="2" to-layer="526" to-port="0" /> <edge from-layer="525" from-port="0" to-layer="526" to-port="1" /> <edge from-layer="526" from-port="2" to-layer="527" to-port="0" /> <edge from-layer="527" from-port="1" to-layer="528" to-port="0" /> <edge from-layer="527" from-port="1" to-layer="1755" to-port="1" /> <edge from-layer="529" from-port="0" to-layer="530" to-port="0" /> <edge from-layer="530" from-port="1" to-layer="533" to-port="0" /> <edge from-layer="531" from-port="0" to-layer="532" to-port="0" /> <edge from-layer="532" from-port="1" to-layer="533" to-port="1" /> <edge from-layer="533" from-port="2" to-layer="535" to-port="0" /> <edge from-layer="534" from-port="0" to-layer="535" to-port="1" /> <edge from-layer="535" from-port="2" to-layer="537" to-port="0" /> <edge from-layer="536" from-port="0" to-layer="537" to-port="1" /> <edge from-layer="537" from-port="2" to-layer="538" to-port="0" /> <edge from-layer="538" from-port="1" to-layer="539" to-port="1" /> <edge from-layer="539" from-port="2" to-layer="541" to-port="0" /> <edge from-layer="540" from-port="0" to-layer="541" to-port="1" /> <edge from-layer="541" from-port="2" to-layer="543" to-port="0" /> <edge from-layer="542" from-port="0" to-layer="543" to-port="1" /> <edge from-layer="543" from-port="2" to-layer="544" to-port="0" /> <edge from-layer="544" from-port="1" to-layer="545" to-port="0" /> <edge from-layer="544" from-port="1" to-layer="4829" to-port="1" /> <edge from-layer="546" from-port="0" to-layer="547" to-port="0" /> <edge from-layer="547" from-port="1" to-layer="550" to-port="0" /> <edge from-layer="548" from-port="0" to-layer="549" to-port="0" /> <edge from-layer="549" from-port="1" to-layer="550" to-port="1" /> <edge from-layer="550" from-port="2" to-layer="552" to-port="0" /> <edge from-layer="551" from-port="0" to-layer="552" to-port="1" /> <edge from-layer="552" from-port="2" to-layer="554" to-port="0" /> <edge from-layer="553" from-port="0" to-layer="554" to-port="1" /> <edge from-layer="554" from-port="2" to-layer="555" to-port="0" /> <edge from-layer="555" from-port="1" to-layer="556" to-port="1" /> <edge from-layer="556" from-port="2" to-layer="558" to-port="0" /> <edge from-layer="557" from-port="0" to-layer="558" to-port="1" /> <edge from-layer="558" from-port="2" to-layer="560" to-port="0" /> <edge from-layer="559" from-port="0" to-layer="560" to-port="1" /> <edge from-layer="560" from-port="2" to-layer="561" to-port="0" /> <edge from-layer="561" from-port="1" to-layer="2959" to-port="1" /> <edge from-layer="561" from-port="1" to-layer="562" to-port="0" /> <edge from-layer="563" from-port="0" to-layer="564" to-port="0" /> <edge from-layer="564" from-port="1" to-layer="567" to-port="0" /> <edge from-layer="565" from-port="0" to-layer="566" to-port="0" /> <edge from-layer="566" from-port="1" to-layer="567" to-port="1" /> <edge from-layer="567" from-port="2" to-layer="569" to-port="0" /> <edge from-layer="568" from-port="0" to-layer="569" to-port="1" /> <edge from-layer="569" from-port="2" to-layer="571" to-port="0" /> <edge from-layer="570" from-port="0" to-layer="571" to-port="1" /> <edge from-layer="571" from-port="2" to-layer="572" to-port="0" /> <edge from-layer="572" from-port="1" to-layer="573" to-port="1" /> <edge from-layer="573" from-port="2" to-layer="575" to-port="0" /> <edge from-layer="574" from-port="0" to-layer="575" to-port="1" /> <edge from-layer="575" from-port="2" to-layer="577" to-port="0" /> <edge from-layer="576" from-port="0" to-layer="577" to-port="1" /> <edge from-layer="577" from-port="2" to-layer="579" to-port="0" /> <edge from-layer="578" from-port="0" to-layer="579" to-port="1" /> <edge from-layer="579" from-port="2" to-layer="580" to-port="0" /> <edge from-layer="580" from-port="1" to-layer="581" to-port="0" /> <edge from-layer="580" from-port="1" to-layer="1415" to-port="2" /> <edge from-layer="582" from-port="0" to-layer="583" to-port="0" /> <edge from-layer="583" from-port="1" to-layer="586" to-port="0" /> <edge from-layer="584" from-port="0" to-layer="585" to-port="0" /> <edge from-layer="585" from-port="1" to-layer="586" to-port="1" /> <edge from-layer="586" from-port="2" to-layer="588" to-port="0" /> <edge from-layer="587" from-port="0" to-layer="588" to-port="1" /> <edge from-layer="588" from-port="2" to-layer="590" to-port="0" /> <edge from-layer="589" from-port="0" to-layer="590" to-port="1" /> <edge from-layer="590" from-port="2" to-layer="591" to-port="0" /> <edge from-layer="591" from-port="1" to-layer="592" to-port="1" /> <edge from-layer="592" from-port="2" to-layer="594" to-port="0" /> <edge from-layer="593" from-port="0" to-layer="594" to-port="1" /> <edge from-layer="594" from-port="2" to-layer="596" to-port="0" /> <edge from-layer="595" from-port="0" to-layer="596" to-port="1" /> <edge from-layer="596" from-port="2" to-layer="597" to-port="0" /> <edge from-layer="597" from-port="1" to-layer="1585" to-port="1" /> <edge from-layer="597" from-port="1" to-layer="598" to-port="0" /> <edge from-layer="599" from-port="0" to-layer="600" to-port="0" /> <edge from-layer="600" from-port="1" to-layer="603" to-port="0" /> <edge from-layer="601" from-port="0" to-layer="602" to-port="0" /> <edge from-layer="602" from-port="1" to-layer="603" to-port="1" /> <edge from-layer="603" from-port="2" to-layer="605" to-port="0" /> <edge from-layer="604" from-port="0" to-layer="605" to-port="1" /> <edge from-layer="605" from-port="2" to-layer="607" to-port="0" /> <edge from-layer="606" from-port="0" to-layer="607" to-port="1" /> <edge from-layer="607" from-port="2" to-layer="608" to-port="0" /> <edge from-layer="608" from-port="1" to-layer="609" to-port="1" /> <edge from-layer="609" from-port="2" to-layer="611" to-port="0" /> <edge from-layer="610" from-port="0" to-layer="611" to-port="1" /> <edge from-layer="611" from-port="2" to-layer="613" to-port="0" /> <edge from-layer="612" from-port="0" to-layer="613" to-port="1" /> <edge from-layer="613" from-port="2" to-layer="614" to-port="0" /> <edge from-layer="614" from-port="1" to-layer="4659" to-port="1" /> <edge from-layer="614" from-port="1" to-layer="615" to-port="0" /> <edge from-layer="616" from-port="0" to-layer="617" to-port="0" /> <edge from-layer="617" from-port="1" to-layer="620" to-port="0" /> <edge from-layer="618" from-port="0" to-layer="619" to-port="0" /> <edge from-layer="619" from-port="1" to-layer="620" to-port="1" /> <edge from-layer="620" from-port="2" to-layer="622" to-port="0" /> <edge from-layer="621" from-port="0" to-layer="622" to-port="1" /> <edge from-layer="622" from-port="2" to-layer="624" to-port="0" /> <edge from-layer="623" from-port="0" to-layer="624" to-port="1" /> <edge from-layer="624" from-port="2" to-layer="625" to-port="0" /> <edge from-layer="625" from-port="1" to-layer="626" to-port="1" /> <edge from-layer="626" from-port="2" to-layer="628" to-port="0" /> <edge from-layer="627" from-port="0" to-layer="628" to-port="1" /> <edge from-layer="628" from-port="2" to-layer="630" to-port="0" /> <edge from-layer="629" from-port="0" to-layer="630" to-port="1" /> <edge from-layer="630" from-port="2" to-layer="632" to-port="0" /> <edge from-layer="631" from-port="0" to-layer="632" to-port="1" /> <edge from-layer="632" from-port="2" to-layer="633" to-port="0" /> <edge from-layer="633" from-port="1" to-layer="634" to-port="0" /> <edge from-layer="633" from-port="1" to-layer="4489" to-port="2" /> <edge from-layer="635" from-port="0" to-layer="636" to-port="0" /> <edge from-layer="636" from-port="1" to-layer="639" to-port="0" /> <edge from-layer="637" from-port="0" to-layer="638" to-port="0" /> <edge from-layer="638" from-port="1" to-layer="639" to-port="1" /> <edge from-layer="639" from-port="2" to-layer="641" to-port="0" /> <edge from-layer="640" from-port="0" to-layer="641" to-port="1" /> <edge from-layer="641" from-port="2" to-layer="643" to-port="0" /> <edge from-layer="642" from-port="0" to-layer="643" to-port="1" /> <edge from-layer="643" from-port="2" to-layer="644" to-port="0" /> <edge from-layer="644" from-port="1" to-layer="645" to-port="1" /> <edge from-layer="645" from-port="2" to-layer="647" to-port="0" /> <edge from-layer="646" from-port="0" to-layer="647" to-port="1" /> <edge from-layer="647" from-port="2" to-layer="649" to-port="0" /> <edge from-layer="648" from-port="0" to-layer="649" to-port="1" /> <edge from-layer="649" from-port="2" to-layer="651" to-port="0" /> <edge from-layer="650" from-port="0" to-layer="651" to-port="1" /> <edge from-layer="651" from-port="2" to-layer="652" to-port="0" /> <edge from-layer="652" from-port="1" to-layer="2789" to-port="2" /> <edge from-layer="652" from-port="1" to-layer="653" to-port="0" /> <edge from-layer="654" from-port="0" to-layer="655" to-port="0" /> <edge from-layer="655" from-port="1" to-layer="658" to-port="0" /> <edge from-layer="656" from-port="0" to-layer="657" to-port="0" /> <edge from-layer="657" from-port="1" to-layer="658" to-port="1" /> <edge from-layer="658" from-port="2" to-layer="660" to-port="0" /> <edge from-layer="659" from-port="0" to-layer="660" to-port="1" /> <edge from-layer="660" from-port="2" to-layer="662" to-port="0" /> <edge from-layer="661" from-port="0" to-layer="662" to-port="1" /> <edge from-layer="662" from-port="2" to-layer="663" to-port="0" /> <edge from-layer="663" from-port="1" to-layer="664" to-port="1" /> <edge from-layer="664" from-port="2" to-layer="666" to-port="0" /> <edge from-layer="665" from-port="0" to-layer="666" to-port="1" /> <edge from-layer="666" from-port="2" to-layer="668" to-port="0" /> <edge from-layer="667" from-port="0" to-layer="668" to-port="1" /> <edge from-layer="668" from-port="2" to-layer="670" to-port="0" /> <edge from-layer="669" from-port="0" to-layer="670" to-port="1" /> <edge from-layer="670" from-port="2" to-layer="671" to-port="0" /> <edge from-layer="671" from-port="1" to-layer="672" to-port="0" /> <edge from-layer="671" from-port="1" to-layer="4319" to-port="2" /> <edge from-layer="673" from-port="0" to-layer="674" to-port="0" /> <edge from-layer="674" from-port="1" to-layer="677" to-port="0" /> <edge from-layer="675" from-port="0" to-layer="676" to-port="0" /> <edge from-layer="676" from-port="1" to-layer="677" to-port="1" /> <edge from-layer="677" from-port="2" to-layer="679" to-port="0" /> <edge from-layer="678" from-port="0" to-layer="679" to-port="1" /> <edge from-layer="679" from-port="2" to-layer="681" to-port="0" /> <edge from-layer="680" from-port="0" to-layer="681" to-port="1" /> <edge from-layer="681" from-port="2" to-layer="682" to-port="0" /> <edge from-layer="682" from-port="1" to-layer="683" to-port="1" /> <edge from-layer="683" from-port="2" to-layer="685" to-port="0" /> <edge from-layer="684" from-port="0" to-layer="685" to-port="1" /> <edge from-layer="685" from-port="2" to-layer="687" to-port="0" /> <edge from-layer="686" from-port="0" to-layer="687" to-port="1" /> <edge from-layer="687" from-port="2" to-layer="688" to-port="0" /> <edge from-layer="688" from-port="1" to-layer="689" to-port="0" /> <edge from-layer="688" from-port="1" to-layer="4489" to-port="1" /> <edge from-layer="690" from-port="0" to-layer="691" to-port="0" /> <edge from-layer="691" from-port="1" to-layer="694" to-port="0" /> <edge from-layer="692" from-port="0" to-layer="693" to-port="0" /> <edge from-layer="693" from-port="1" to-layer="694" to-port="1" /> <edge from-layer="694" from-port="2" to-layer="696" to-port="0" /> <edge from-layer="695" from-port="0" to-layer="696" to-port="1" /> <edge from-layer="696" from-port="2" to-layer="698" to-port="0" /> <edge from-layer="697" from-port="0" to-layer="698" to-port="1" /> <edge from-layer="698" from-port="2" to-layer="699" to-port="0" /> <edge from-layer="699" from-port="1" to-layer="700" to-port="1" /> <edge from-layer="700" from-port="2" to-layer="702" to-port="0" /> <edge from-layer="701" from-port="0" to-layer="702" to-port="1" /> <edge from-layer="702" from-port="2" to-layer="704" to-port="0" /> <edge from-layer="703" from-port="0" to-layer="704" to-port="1" /> <edge from-layer="704" from-port="2" to-layer="705" to-port="0" /> <edge from-layer="705" from-port="1" to-layer="2789" to-port="1" /> <edge from-layer="705" from-port="1" to-layer="706" to-port="0" /> <edge from-layer="707" from-port="0" to-layer="708" to-port="0" /> <edge from-layer="708" from-port="1" to-layer="711" to-port="0" /> <edge from-layer="709" from-port="0" to-layer="710" to-port="0" /> <edge from-layer="710" from-port="1" to-layer="711" to-port="1" /> <edge from-layer="711" from-port="2" to-layer="713" to-port="0" /> <edge from-layer="712" from-port="0" to-layer="713" to-port="1" /> <edge from-layer="713" from-port="2" to-layer="715" to-port="0" /> <edge from-layer="714" from-port="0" to-layer="715" to-port="1" /> <edge from-layer="715" from-port="2" to-layer="716" to-port="0" /> <edge from-layer="716" from-port="1" to-layer="717" to-port="1" /> <edge from-layer="717" from-port="2" to-layer="719" to-port="0" /> <edge from-layer="718" from-port="0" to-layer="719" to-port="1" /> <edge from-layer="719" from-port="2" to-layer="721" to-port="0" /> <edge from-layer="720" from-port="0" to-layer="721" to-port="1" /> <edge from-layer="721" from-port="2" to-layer="723" to-port="0" /> <edge from-layer="722" from-port="0" to-layer="723" to-port="1" /> <edge from-layer="723" from-port="2" to-layer="724" to-port="0" /> <edge from-layer="724" from-port="1" to-layer="725" to-port="0" /> <edge from-layer="724" from-port="1" to-layer="2619" to-port="2" /> <edge from-layer="726" from-port="0" to-layer="727" to-port="0" /> <edge from-layer="727" from-port="1" to-layer="730" to-port="0" /> <edge from-layer="728" from-port="0" to-layer="729" to-port="0" /> <edge from-layer="729" from-port="1" to-layer="730" to-port="1" /> <edge from-layer="730" from-port="2" to-layer="732" to-port="0" /> <edge from-layer="731" from-port="0" to-layer="732" to-port="1" /> <edge from-layer="732" from-port="2" to-layer="734" to-port="0" /> <edge from-layer="733" from-port="0" to-layer="734" to-port="1" /> <edge from-layer="734" from-port="2" to-layer="735" to-port="0" /> <edge from-layer="735" from-port="1" to-layer="736" to-port="1" /> <edge from-layer="736" from-port="2" to-layer="738" to-port="0" /> <edge from-layer="737" from-port="0" to-layer="738" to-port="1" /> <edge from-layer="738" from-port="2" to-layer="740" to-port="0" /> <edge from-layer="739" from-port="0" to-layer="740" to-port="1" /> <edge from-layer="740" from-port="2" to-layer="742" to-port="0" /> <edge from-layer="741" from-port="0" to-layer="742" to-port="1" /> <edge from-layer="742" from-port="2" to-layer="743" to-port="0" /> <edge from-layer="743" from-port="1" to-layer="744" to-port="0" /> <edge from-layer="743" from-port="1" to-layer="1245" to-port="2" /> <edge from-layer="745" from-port="0" to-layer="746" to-port="0" /> <edge from-layer="746" from-port="1" to-layer="749" to-port="0" /> <edge from-layer="747" from-port="0" to-layer="748" to-port="0" /> <edge from-layer="748" from-port="1" to-layer="749" to-port="1" /> <edge from-layer="749" from-port="2" to-layer="751" to-port="0" /> <edge from-layer="750" from-port="0" to-layer="751" to-port="1" /> <edge from-layer="751" from-port="2" to-layer="753" to-port="0" /> <edge from-layer="752" from-port="0" to-layer="753" to-port="1" /> <edge from-layer="753" from-port="2" to-layer="754" to-port="0" /> <edge from-layer="754" from-port="1" to-layer="755" to-port="1" /> <edge from-layer="755" from-port="2" to-layer="757" to-port="0" /> <edge from-layer="756" from-port="0" to-layer="757" to-port="1" /> <edge from-layer="757" from-port="2" to-layer="759" to-port="0" /> <edge from-layer="758" from-port="0" to-layer="759" to-port="1" /> <edge from-layer="759" from-port="2" to-layer="760" to-port="0" /> <edge from-layer="760" from-port="1" to-layer="1415" to-port="1" /> <edge from-layer="760" from-port="1" to-layer="761" to-port="0" /> <edge from-layer="762" from-port="0" to-layer="763" to-port="0" /> <edge from-layer="763" from-port="1" to-layer="766" to-port="0" /> <edge from-layer="764" from-port="0" to-layer="765" to-port="0" /> <edge from-layer="765" from-port="1" to-layer="766" to-port="1" /> <edge from-layer="766" from-port="2" to-layer="768" to-port="0" /> <edge from-layer="767" from-port="0" to-layer="768" to-port="1" /> <edge from-layer="768" from-port="2" to-layer="770" to-port="0" /> <edge from-layer="769" from-port="0" to-layer="770" to-port="1" /> <edge from-layer="770" from-port="2" to-layer="771" to-port="0" /> <edge from-layer="771" from-port="1" to-layer="772" to-port="1" /> <edge from-layer="772" from-port="2" to-layer="774" to-port="0" /> <edge from-layer="773" from-port="0" to-layer="774" to-port="1" /> <edge from-layer="774" from-port="2" to-layer="776" to-port="0" /> <edge from-layer="775" from-port="0" to-layer="776" to-port="1" /> <edge from-layer="776" from-port="2" to-layer="777" to-port="0" /> <edge from-layer="777" from-port="1" to-layer="778" to-port="0" /> <edge from-layer="777" from-port="1" to-layer="4319" to-port="1" /> <edge from-layer="779" from-port="0" to-layer="780" to-port="0" /> <edge from-layer="780" from-port="1" to-layer="783" to-port="0" /> <edge from-layer="781" from-port="0" to-layer="782" to-port="0" /> <edge from-layer="782" from-port="1" to-layer="783" to-port="1" /> <edge from-layer="783" from-port="2" to-layer="785" to-port="0" /> <edge from-layer="784" from-port="0" to-layer="785" to-port="1" /> <edge from-layer="785" from-port="2" to-layer="787" to-port="0" /> <edge from-layer="786" from-port="0" to-layer="787" to-port="1" /> <edge from-layer="787" from-port="2" to-layer="788" to-port="0" /> <edge from-layer="788" from-port="1" to-layer="789" to-port="1" /> <edge from-layer="789" from-port="2" to-layer="791" to-port="0" /> <edge from-layer="790" from-port="0" to-layer="791" to-port="1" /> <edge from-layer="791" from-port="2" to-layer="793" to-port="0" /> <edge from-layer="792" from-port="0" to-layer="793" to-port="1" /> <edge from-layer="793" from-port="2" to-layer="795" to-port="0" /> <edge from-layer="794" from-port="0" to-layer="795" to-port="1" /> <edge from-layer="795" from-port="2" to-layer="796" to-port="0" /> <edge from-layer="796" from-port="1" to-layer="797" to-port="0" /> <edge from-layer="796" from-port="1" to-layer="4149" to-port="2" /> <edge from-layer="798" from-port="0" to-layer="799" to-port="0" /> <edge from-layer="799" from-port="1" to-layer="802" to-port="0" /> <edge from-layer="800" from-port="0" to-layer="801" to-port="0" /> <edge from-layer="801" from-port="1" to-layer="802" to-port="1" /> <edge from-layer="802" from-port="2" to-layer="804" to-port="0" /> <edge from-layer="803" from-port="0" to-layer="804" to-port="1" /> <edge from-layer="804" from-port="2" to-layer="806" to-port="0" /> <edge from-layer="805" from-port="0" to-layer="806" to-port="1" /> <edge from-layer="806" from-port="2" to-layer="807" to-port="0" /> <edge from-layer="807" from-port="1" to-layer="808" to-port="1" /> <edge from-layer="808" from-port="2" to-layer="810" to-port="0" /> <edge from-layer="809" from-port="0" to-layer="810" to-port="1" /> <edge from-layer="810" from-port="2" to-layer="812" to-port="0" /> <edge from-layer="811" from-port="0" to-layer="812" to-port="1" /> <edge from-layer="812" from-port="2" to-layer="813" to-port="0" /> <edge from-layer="813" from-port="1" to-layer="814" to-port="0" /> <edge from-layer="813" from-port="1" to-layer="2619" to-port="1" /> <edge from-layer="815" from-port="0" to-layer="816" to-port="0" /> <edge from-layer="816" from-port="1" to-layer="819" to-port="0" /> <edge from-layer="817" from-port="0" to-layer="818" to-port="0" /> <edge from-layer="818" from-port="1" to-layer="819" to-port="1" /> <edge from-layer="819" from-port="2" to-layer="821" to-port="0" /> <edge from-layer="820" from-port="0" to-layer="821" to-port="1" /> <edge from-layer="821" from-port="2" to-layer="823" to-port="0" /> <edge from-layer="822" from-port="0" to-layer="823" to-port="1" /> <edge from-layer="823" from-port="2" to-layer="824" to-port="0" /> <edge from-layer="824" from-port="1" to-layer="825" to-port="1" /> <edge from-layer="825" from-port="2" to-layer="827" to-port="0" /> <edge from-layer="826" from-port="0" to-layer="827" to-port="1" /> <edge from-layer="827" from-port="2" to-layer="829" to-port="0" /> <edge from-layer="828" from-port="0" to-layer="829" to-port="1" /> <edge from-layer="829" from-port="2" to-layer="830" to-port="0" /> <edge from-layer="830" from-port="1" to-layer="831" to-port="0" /> <edge from-layer="830" from-port="1" to-layer="1245" to-port="1" /> <edge from-layer="832" from-port="0" to-layer="833" to-port="0" /> <edge from-layer="833" from-port="1" to-layer="836" to-port="0" /> <edge from-layer="834" from-port="0" to-layer="835" to-port="0" /> <edge from-layer="835" from-port="1" to-layer="836" to-port="1" /> <edge from-layer="836" from-port="2" to-layer="838" to-port="0" /> <edge from-layer="837" from-port="0" to-layer="838" to-port="1" /> <edge from-layer="838" from-port="2" to-layer="840" to-port="0" /> <edge from-layer="839" from-port="0" to-layer="840" to-port="1" /> <edge from-layer="840" from-port="2" to-layer="841" to-port="0" /> <edge from-layer="841" from-port="1" to-layer="842" to-port="1" /> <edge from-layer="842" from-port="2" to-layer="844" to-port="0" /> <edge from-layer="843" from-port="0" to-layer="844" to-port="1" /> <edge from-layer="844" from-port="2" to-layer="846" to-port="0" /> <edge from-layer="845" from-port="0" to-layer="846" to-port="1" /> <edge from-layer="846" from-port="2" to-layer="848" to-port="0" /> <edge from-layer="847" from-port="0" to-layer="848" to-port="1" /> <edge from-layer="848" from-port="2" to-layer="849" to-port="0" /> <edge from-layer="849" from-port="1" to-layer="3979" to-port="2" /> <edge from-layer="849" from-port="1" to-layer="850" to-port="0" /> <edge from-layer="851" from-port="0" to-layer="852" to-port="0" /> <edge from-layer="852" from-port="1" to-layer="855" to-port="0" /> <edge from-layer="853" from-port="0" to-layer="854" to-port="0" /> <edge from-layer="854" from-port="1" to-layer="855" to-port="1" /> <edge from-layer="855" from-port="2" to-layer="857" to-port="0" /> <edge from-layer="856" from-port="0" to-layer="857" to-port="1" /> <edge from-layer="857" from-port="2" to-layer="859" to-port="0" /> <edge from-layer="858" from-port="0" to-layer="859" to-port="1" /> <edge from-layer="859" from-port="2" to-layer="860" to-port="0" /> <edge from-layer="860" from-port="1" to-layer="861" to-port="1" /> <edge from-layer="861" from-port="2" to-layer="863" to-port="0" /> <edge from-layer="862" from-port="0" to-layer="863" to-port="1" /> <edge from-layer="863" from-port="2" to-layer="865" to-port="0" /> <edge from-layer="864" from-port="0" to-layer="865" to-port="1" /> <edge from-layer="865" from-port="2" to-layer="866" to-port="0" /> <edge from-layer="866" from-port="1" to-layer="4149" to-port="1" /> <edge from-layer="866" from-port="1" to-layer="867" to-port="0" /> <edge from-layer="868" from-port="0" to-layer="877" to-port="0" /> <edge from-layer="869" from-port="1" to-layer="872" to-port="0" /> <edge from-layer="870" from-port="0" to-layer="872" to-port="1" /> <edge from-layer="871" from-port="0" to-layer="872" to-port="2" /> <edge from-layer="872" from-port="3" to-layer="1835" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="1860" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2724" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="1495" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="1690" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="1665" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="1520" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2005" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="1350" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="1325" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="1180" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="1155" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2699" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3719" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4594" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4764" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4569" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4424" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4399" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4911" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4254" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4229" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4084" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4059" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2555" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3914" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2517" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3889" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3744" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="4739" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2370" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3574" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2345" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3549" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3404" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3379" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2200" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3234" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3209" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2175" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3064" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="3039" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2894" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2030" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="2869" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="942" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="876" to-port="0" /> <edge from-layer="872" from-port="3" to-layer="967" to-port="0" /> <edge from-layer="873" from-port="0" to-layer="876" to-port="1" /> <edge from-layer="874" from-port="0" to-layer="876" to-port="2" /> <edge from-layer="875" from-port="0" to-layer="876" to-port="3" /> <edge from-layer="876" from-port="4" to-layer="877" to-port="1" /> <edge from-layer="877" from-port="2" to-layer="878" to-port="0" /> <edge from-layer="878" from-port="1" to-layer="880" to-port="0" /> <edge from-layer="879" from-port="0" to-layer="880" to-port="2" /> <edge from-layer="880" from-port="3" to-layer="2511" to-port="0" /> <edge from-layer="881" from-port="0" to-layer="882" to-port="0" /> <edge from-layer="882" from-port="1" to-layer="885" to-port="0" /> <edge from-layer="883" from-port="0" to-layer="884" to-port="0" /> <edge from-layer="884" from-port="1" to-layer="885" to-port="1" /> <edge from-layer="885" from-port="2" to-layer="887" to-port="0" /> <edge from-layer="886" from-port="0" to-layer="887" to-port="1" /> <edge from-layer="887" from-port="2" to-layer="888" to-port="0" /> <edge from-layer="888" from-port="1" to-layer="5083" to-port="1" /> <edge from-layer="888" from-port="1" to-layer="893" to-port="0" /> <edge from-layer="889" from-port="0" to-layer="890" to-port="1" /> <edge from-layer="890" from-port="2" to-layer="891" to-port="0" /> <edge from-layer="891" from-port="1" to-layer="893" to-port="1" /> <edge from-layer="892" from-port="0" to-layer="893" to-port="2" /> <edge from-layer="893" from-port="3" to-layer="914" to-port="0" /> <edge from-layer="894" from-port="0" to-layer="895" to-port="0" /> <edge from-layer="895" from-port="1" to-layer="898" to-port="0" /> <edge from-layer="896" from-port="0" to-layer="897" to-port="0" /> <edge from-layer="897" from-port="1" to-layer="898" to-port="1" /> <edge from-layer="898" from-port="2" to-layer="900" to-port="0" /> <edge from-layer="899" from-port="0" to-layer="900" to-port="1" /> <edge from-layer="900" from-port="2" to-layer="901" to-port="0" /> <edge from-layer="901" from-port="1" to-layer="913" to-port="0" /> <edge from-layer="902" from-port="0" to-layer="1018" to-port="1" /> <edge from-layer="902" from-port="0" to-layer="903" to-port="1" /> <edge from-layer="903" from-port="2" to-layer="910" to-port="0" /> <edge from-layer="904" from-port="1" to-layer="907" to-port="0" /> <edge from-layer="904" from-port="1" to-layer="998" to-port="0" /> <edge from-layer="905" from-port="0" to-layer="907" to-port="1" /> <edge from-layer="906" from-port="0" to-layer="907" to-port="2" /> <edge from-layer="907" from-port="3" to-layer="909" to-port="0" /> <edge from-layer="907" from-port="3" to-layer="1024" to-port="0" /> <edge from-layer="908" from-port="0" to-layer="909" to-port="1" /> <edge from-layer="909" from-port="2" to-layer="910" to-port="1" /> <edge from-layer="910" from-port="2" to-layer="911" to-port="0" /> <edge from-layer="911" from-port="1" to-layer="913" to-port="1" /> <edge from-layer="912" from-port="0" to-layer="913" to-port="2" /> <edge from-layer="913" from-port="3" to-layer="914" to-port="1" /> <edge from-layer="914" from-port="2" to-layer="1051" to-port="0" /> <edge from-layer="914" from-port="2" to-layer="916" to-port="0" /> <edge from-layer="915" from-port="0" to-layer="916" to-port="1" /> <edge from-layer="916" from-port="2" to-layer="918" to-port="0" /> <edge from-layer="917" from-port="0" to-layer="918" to-port="1" /> <edge from-layer="918" from-port="2" to-layer="920" to-port="0" /> <edge from-layer="919" from-port="0" to-layer="920" to-port="1" /> <edge from-layer="920" from-port="2" to-layer="982" to-port="0" /> <edge from-layer="920" from-port="2" to-layer="931" to-port="0" /> <edge from-layer="920" from-port="2" to-layer="957" to-port="0" /> <edge from-layer="921" from-port="0" to-layer="922" to-port="0" /> <edge from-layer="922" from-port="1" to-layer="925" to-port="0" /> <edge from-layer="923" from-port="0" to-layer="924" to-port="0" /> <edge from-layer="924" from-port="1" to-layer="925" to-port="1" /> <edge from-layer="925" from-port="2" to-layer="927" to-port="0" /> <edge from-layer="926" from-port="0" to-layer="927" to-port="1" /> <edge from-layer="927" from-port="2" to-layer="929" to-port="0" /> <edge from-layer="928" from-port="0" to-layer="929" to-port="1" /> <edge from-layer="929" from-port="2" to-layer="930" to-port="0" /> <edge from-layer="930" from-port="1" to-layer="931" to-port="1" /> <edge from-layer="931" from-port="2" to-layer="933" to-port="0" /> <edge from-layer="932" from-port="0" to-layer="933" to-port="1" /> <edge from-layer="933" from-port="2" to-layer="935" to-port="0" /> <edge from-layer="934" from-port="0" to-layer="935" to-port="1" /> <edge from-layer="935" from-port="2" to-layer="937" to-port="0" /> <edge from-layer="936" from-port="0" to-layer="937" to-port="1" /> <edge from-layer="937" from-port="2" to-layer="1033" to-port="0" /> <edge from-layer="938" from-port="0" to-layer="943" to-port="0" /> <edge from-layer="939" from-port="0" to-layer="942" to-port="1" /> <edge from-layer="940" from-port="0" to-layer="942" to-port="2" /> <edge from-layer="941" from-port="0" to-layer="942" to-port="3" /> <edge from-layer="942" from-port="4" to-layer="943" to-port="1" /> <edge from-layer="943" from-port="2" to-layer="944" to-port="0" /> <edge from-layer="944" from-port="1" to-layer="946" to-port="0" /> <edge from-layer="945" from-port="0" to-layer="946" to-port="2" /> <edge from-layer="946" from-port="3" to-layer="992" to-port="0" /> <edge from-layer="946" from-port="3" to-layer="962" to-port="0" /> <edge from-layer="947" from-port="0" to-layer="948" to-port="0" /> <edge from-layer="948" from-port="1" to-layer="951" to-port="0" /> <edge from-layer="949" from-port="0" to-layer="950" to-port="0" /> <edge from-layer="950" from-port="1" to-layer="951" to-port="1" /> <edge from-layer="951" from-port="2" to-layer="953" to-port="0" /> <edge from-layer="952" from-port="0" to-layer="953" to-port="1" /> <edge from-layer="953" from-port="2" to-layer="955" to-port="0" /> <edge from-layer="954" from-port="0" to-layer="955" to-port="1" /> <edge from-layer="955" from-port="2" to-layer="956" to-port="0" /> <edge from-layer="956" from-port="1" to-layer="957" to-port="1" /> <edge from-layer="957" from-port="2" to-layer="959" to-port="0" /> <edge from-layer="958" from-port="0" to-layer="959" to-port="1" /> <edge from-layer="959" from-port="2" to-layer="961" to-port="0" /> <edge from-layer="960" from-port="0" to-layer="961" to-port="1" /> <edge from-layer="961" from-port="2" to-layer="962" to-port="1" /> <edge from-layer="962" from-port="2" to-layer="4964" to-port="0" /> <edge from-layer="962" from-port="2" to-layer="1033" to-port="1" /> <edge from-layer="963" from-port="0" to-layer="968" to-port="0" /> <edge from-layer="964" from-port="0" to-layer="967" to-port="1" /> <edge from-layer="965" from-port="0" to-layer="967" to-port="2" /> <edge from-layer="966" from-port="0" to-layer="967" to-port="3" /> <edge from-layer="967" from-port="4" to-layer="968" to-port="1" /> <edge from-layer="968" from-port="2" to-layer="969" to-port="0" /> <edge from-layer="969" from-port="1" to-layer="971" to-port="0" /> <edge from-layer="970" from-port="0" to-layer="971" to-port="2" /> <edge from-layer="971" from-port="3" to-layer="989" to-port="0" /> <edge from-layer="972" from-port="0" to-layer="973" to-port="0" /> <edge from-layer="973" from-port="1" to-layer="976" to-port="0" /> <edge from-layer="974" from-port="0" to-layer="975" to-port="0" /> <edge from-layer="975" from-port="1" to-layer="976" to-port="1" /> <edge from-layer="976" from-port="2" to-layer="978" to-port="0" /> <edge from-layer="977" from-port="0" to-layer="978" to-port="1" /> <edge from-layer="978" from-port="2" to-layer="980" to-port="0" /> <edge from-layer="979" from-port="0" to-layer="980" to-port="1" /> <edge from-layer="980" from-port="2" to-layer="981" to-port="0" /> <edge from-layer="981" from-port="1" to-layer="982" to-port="1" /> <edge from-layer="982" from-port="2" to-layer="984" to-port="0" /> <edge from-layer="983" from-port="0" to-layer="984" to-port="1" /> <edge from-layer="984" from-port="2" to-layer="986" to-port="0" /> <edge from-layer="985" from-port="0" to-layer="986" to-port="1" /> <edge from-layer="986" from-port="2" to-layer="988" to-port="0" /> <edge from-layer="987" from-port="0" to-layer="988" to-port="1" /> <edge from-layer="988" from-port="2" to-layer="989" to-port="1" /> <edge from-layer="989" from-port="2" to-layer="1033" to-port="2" /> <edge from-layer="989" from-port="2" to-layer="4963" to-port="0" /> <edge from-layer="990" from-port="0" to-layer="1009" to-port="0" /> <edge from-layer="991" from-port="0" to-layer="1003" to-port="0" /> <edge from-layer="992" from-port="1" to-layer="995" to-port="0" /> <edge from-layer="993" from-port="0" to-layer="995" to-port="1" /> <edge from-layer="994" from-port="0" to-layer="995" to-port="2" /> <edge from-layer="995" from-port="3" to-layer="1028" to-port="0" /> <edge from-layer="995" from-port="3" to-layer="999" to-port="0" /> <edge from-layer="996" from-port="0" to-layer="998" to-port="1" /> <edge from-layer="997" from-port="0" to-layer="998" to-port="2" /> <edge from-layer="998" from-port="3" to-layer="1012" to-port="0" /> <edge from-layer="998" from-port="3" to-layer="999" to-port="1" /> <edge from-layer="999" from-port="2" to-layer="1001" to-port="0" /> <edge from-layer="1000" from-port="0" to-layer="1001" to-port="1" /> <edge from-layer="1001" from-port="2" to-layer="1003" to-port="1" /> <edge from-layer="1001" from-port="2" to-layer="1014" to-port="0" /> <edge from-layer="1002" from-port="0" to-layer="1003" to-port="2" /> <edge from-layer="1003" from-port="3" to-layer="1004" to-port="0" /> <edge from-layer="1004" from-port="1" to-layer="1007" to-port="0" /> <edge from-layer="1005" from-port="0" to-layer="1006" to-port="1" /> <edge from-layer="1006" from-port="2" to-layer="1007" to-port="1" /> <edge from-layer="1007" from-port="2" to-layer="1008" to-port="0" /> <edge from-layer="1008" from-port="1" to-layer="1009" to-port="1" /> <edge from-layer="1009" from-port="2" to-layer="1010" to-port="0" /> <edge from-layer="1009" from-port="2" to-layer="1017" to-port="0" /> <edge from-layer="1010" from-port="1" to-layer="1016" to-port="0" /> <edge from-layer="1011" from-port="0" to-layer="1012" to-port="1" /> <edge from-layer="1012" from-port="2" to-layer="1029" to-port="1" /> <edge from-layer="1012" from-port="2" to-layer="1015" to-port="0" /> <edge from-layer="1013" from-port="0" to-layer="1014" to-port="1" /> <edge from-layer="1014" from-port="2" to-layer="1015" to-port="1" /> <edge from-layer="1015" from-port="2" to-layer="1016" to-port="1" /> <edge from-layer="1016" from-port="2" to-layer="1017" to-port="1" /> <edge from-layer="1017" from-port="2" to-layer="1018" to-port="0" /> <edge from-layer="1018" from-port="2" to-layer="1020" to-port="0" /> <edge from-layer="1019" from-port="0" to-layer="1020" to-port="1" /> <edge from-layer="1020" from-port="2" to-layer="1025" to-port="0" /> <edge from-layer="1021" from-port="0" to-layer="1024" to-port="1" /> <edge from-layer="1022" from-port="0" to-layer="1024" to-port="2" /> <edge from-layer="1023" from-port="0" to-layer="1024" to-port="3" /> <edge from-layer="1024" from-port="4" to-layer="1025" to-port="1" /> <edge from-layer="1025" from-port="2" to-layer="1032" to-port="0" /> <edge from-layer="1026" from-port="0" to-layer="1032" to-port="1" /> <edge from-layer="1027" from-port="0" to-layer="1028" to-port="1" /> <edge from-layer="1028" from-port="2" to-layer="1029" to-port="0" /> <edge from-layer="1029" from-port="2" to-layer="1032" to-port="2" /> <edge from-layer="1030" from-port="0" to-layer="1032" to-port="3" /> <edge from-layer="1031" from-port="0" to-layer="1032" to-port="4" /> <edge from-layer="1032" from-port="5" to-layer="3597" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="3767" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="3087" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="3937" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="4107" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="4277" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="1203" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="4447" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="4617" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="4787" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="3427" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="1033" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="3257" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="2053" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="2917" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="2747" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="1883" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="1713" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="1543" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="1373" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="2223" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="2393" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="2577" to-port="3" /> <edge from-layer="1032" from-port="5" to-layer="4982" to-port="3" /> <edge from-layer="1033" from-port="4" to-layer="1035" to-port="0" /> <edge from-layer="1034" from-port="0" to-layer="1035" to-port="1" /> <edge from-layer="1035" from-port="2" to-layer="1037" to-port="0" /> <edge from-layer="1036" from-port="0" to-layer="1037" to-port="1" /> <edge from-layer="1037" from-port="2" to-layer="1048" to-port="0" /> <edge from-layer="1038" from-port="0" to-layer="1039" to-port="0" /> <edge from-layer="1039" from-port="1" to-layer="1042" to-port="0" /> <edge from-layer="1040" from-port="0" to-layer="1041" to-port="0" /> <edge from-layer="1041" from-port="1" to-layer="1042" to-port="1" /> <edge from-layer="1042" from-port="2" to-layer="1044" to-port="0" /> <edge from-layer="1043" from-port="0" to-layer="1044" to-port="1" /> <edge from-layer="1044" from-port="2" to-layer="1046" to-port="0" /> <edge from-layer="1045" from-port="0" to-layer="1046" to-port="1" /> <edge from-layer="1046" from-port="2" to-layer="1047" to-port="0" /> <edge from-layer="1047" from-port="1" to-layer="1048" to-port="1" /> <edge from-layer="1048" from-port="2" to-layer="1050" to-port="0" /> <edge from-layer="1049" from-port="0" to-layer="1050" to-port="1" /> <edge from-layer="1050" from-port="2" to-layer="1051" to-port="1" /> <edge from-layer="1051" from-port="2" to-layer="1053" to-port="0" /> <edge from-layer="1051" from-port="2" to-layer="1093" to-port="0" /> <edge from-layer="1052" from-port="0" to-layer="1053" to-port="1" /> <edge from-layer="1053" from-port="2" to-layer="1055" to-port="0" /> <edge from-layer="1054" from-port="0" to-layer="1055" to-port="1" /> <edge from-layer="1055" from-port="2" to-layer="1057" to-port="0" /> <edge from-layer="1056" from-port="0" to-layer="1057" to-port="1" /> <edge from-layer="1057" from-port="2" to-layer="1068" to-port="0" /> <edge from-layer="1058" from-port="0" to-layer="1059" to-port="0" /> <edge from-layer="1059" from-port="1" to-layer="1062" to-port="0" /> <edge from-layer="1060" from-port="0" to-layer="1061" to-port="0" /> <edge from-layer="1061" from-port="1" to-layer="1062" to-port="1" /> <edge from-layer="1062" from-port="2" to-layer="1064" to-port="0" /> <edge from-layer="1063" from-port="0" to-layer="1064" to-port="1" /> <edge from-layer="1064" from-port="2" to-layer="1066" to-port="0" /> <edge from-layer="1065" from-port="0" to-layer="1066" to-port="1" /> <edge from-layer="1066" from-port="2" to-layer="1067" to-port="0" /> <edge from-layer="1067" from-port="1" to-layer="1068" to-port="1" /> <edge from-layer="1068" from-port="2" to-layer="1070" to-port="0" /> <edge from-layer="1069" from-port="0" to-layer="1070" to-port="1" /> <edge from-layer="1070" from-port="2" to-layer="1072" to-port="0" /> <edge from-layer="1071" from-port="0" to-layer="1072" to-port="1" /> <edge from-layer="1072" from-port="2" to-layer="1074" to-port="0" /> <edge from-layer="1073" from-port="0" to-layer="1074" to-port="1" /> <edge from-layer="1074" from-port="2" to-layer="1075" to-port="0" /> <edge from-layer="1075" from-port="3" to-layer="1077" to-port="0" /> <edge from-layer="1076" from-port="0" to-layer="1077" to-port="1" /> <edge from-layer="1077" from-port="2" to-layer="1079" to-port="0" /> <edge from-layer="1078" from-port="0" to-layer="1079" to-port="1" /> <edge from-layer="1079" from-port="2" to-layer="1090" to-port="0" /> <edge from-layer="1080" from-port="0" to-layer="1081" to-port="0" /> <edge from-layer="1081" from-port="1" to-layer="1084" to-port="0" /> <edge from-layer="1082" from-port="0" to-layer="1083" to-port="0" /> <edge from-layer="1083" from-port="1" to-layer="1084" to-port="1" /> <edge from-layer="1084" from-port="2" to-layer="1086" to-port="0" /> <edge from-layer="1085" from-port="0" to-layer="1086" to-port="1" /> <edge from-layer="1086" from-port="2" to-layer="1088" to-port="0" /> <edge from-layer="1087" from-port="0" to-layer="1088" to-port="1" /> <edge from-layer="1088" from-port="2" to-layer="1089" to-port="0" /> <edge from-layer="1089" from-port="1" to-layer="1090" to-port="1" /> <edge from-layer="1090" from-port="2" to-layer="1092" to-port="0" /> <edge from-layer="1091" from-port="0" to-layer="1092" to-port="1" /> <edge from-layer="1092" from-port="2" to-layer="1093" to-port="1" /> <edge from-layer="1093" from-port="2" to-layer="1127" to-port="0" /> <edge from-layer="1093" from-port="2" to-layer="1095" to-port="0" /> <edge from-layer="1094" from-port="0" to-layer="1095" to-port="1" /> <edge from-layer="1095" from-port="2" to-layer="1097" to-port="0" /> <edge from-layer="1096" from-port="0" to-layer="1097" to-port="1" /> <edge from-layer="1097" from-port="2" to-layer="1099" to-port="0" /> <edge from-layer="1098" from-port="0" to-layer="1099" to-port="1" /> <edge from-layer="1099" from-port="2" to-layer="1110" to-port="0" /> <edge from-layer="1100" from-port="0" to-layer="1101" to-port="0" /> <edge from-layer="1101" from-port="1" to-layer="1104" to-port="0" /> <edge from-layer="1102" from-port="0" to-layer="1103" to-port="0" /> <edge from-layer="1103" from-port="1" to-layer="1104" to-port="1" /> <edge from-layer="1104" from-port="2" to-layer="1106" to-port="0" /> <edge from-layer="1105" from-port="0" to-layer="1106" to-port="1" /> <edge from-layer="1106" from-port="2" to-layer="1108" to-port="0" /> <edge from-layer="1107" from-port="0" to-layer="1108" to-port="1" /> <edge from-layer="1108" from-port="2" to-layer="1109" to-port="0" /> <edge from-layer="1109" from-port="1" to-layer="1110" to-port="1" /> <edge from-layer="1110" from-port="2" to-layer="1112" to-port="0" /> <edge from-layer="1111" from-port="0" to-layer="1112" to-port="1" /> <edge from-layer="1112" from-port="2" to-layer="1113" to-port="0" /> <edge from-layer="1113" from-port="1" to-layer="1124" to-port="0" /> <edge from-layer="1114" from-port="0" to-layer="1115" to-port="0" /> <edge from-layer="1115" from-port="1" to-layer="1118" to-port="0" /> <edge from-layer="1116" from-port="0" to-layer="1117" to-port="0" /> <edge from-layer="1117" from-port="1" to-layer="1118" to-port="1" /> <edge from-layer="1118" from-port="2" to-layer="1120" to-port="0" /> <edge from-layer="1119" from-port="0" to-layer="1120" to-port="1" /> <edge from-layer="1120" from-port="2" to-layer="1122" to-port="0" /> <edge from-layer="1121" from-port="0" to-layer="1122" to-port="1" /> <edge from-layer="1122" from-port="2" to-layer="1123" to-port="0" /> <edge from-layer="1123" from-port="1" to-layer="1124" to-port="1" /> <edge from-layer="1124" from-port="2" to-layer="1126" to-port="0" /> <edge from-layer="1125" from-port="0" to-layer="1126" to-port="1" /> <edge from-layer="1126" from-port="2" to-layer="1127" to-port="1" /> <edge from-layer="1127" from-port="2" to-layer="1129" to-port="0" /> <edge from-layer="1127" from-port="2" to-layer="1221" to-port="0" /> <edge from-layer="1128" from-port="0" to-layer="1129" to-port="1" /> <edge from-layer="1129" from-port="2" to-layer="1131" to-port="0" /> <edge from-layer="1130" from-port="0" to-layer="1131" to-port="1" /> <edge from-layer="1131" from-port="2" to-layer="1133" to-port="0" /> <edge from-layer="1132" from-port="0" to-layer="1133" to-port="1" /> <edge from-layer="1133" from-port="2" to-layer="1195" to-port="0" /> <edge from-layer="1133" from-port="2" to-layer="1144" to-port="0" /> <edge from-layer="1133" from-port="2" to-layer="1170" to-port="0" /> <edge from-layer="1134" from-port="0" to-layer="1135" to-port="0" /> <edge from-layer="1135" from-port="1" to-layer="1138" to-port="0" /> <edge from-layer="1136" from-port="0" to-layer="1137" to-port="0" /> <edge from-layer="1137" from-port="1" to-layer="1138" to-port="1" /> <edge from-layer="1138" from-port="2" to-layer="1140" to-port="0" /> <edge from-layer="1139" from-port="0" to-layer="1140" to-port="1" /> <edge from-layer="1140" from-port="2" to-layer="1142" to-port="0" /> <edge from-layer="1141" from-port="0" to-layer="1142" to-port="1" /> <edge from-layer="1142" from-port="2" to-layer="1143" to-port="0" /> <edge from-layer="1143" from-port="1" to-layer="1144" to-port="1" /> <edge from-layer="1144" from-port="2" to-layer="1146" to-port="0" /> <edge from-layer="1145" from-port="0" to-layer="1146" to-port="1" /> <edge from-layer="1146" from-port="2" to-layer="1148" to-port="0" /> <edge from-layer="1147" from-port="0" to-layer="1148" to-port="1" /> <edge from-layer="1148" from-port="2" to-layer="1150" to-port="0" /> <edge from-layer="1149" from-port="0" to-layer="1150" to-port="1" /> <edge from-layer="1150" from-port="2" to-layer="1203" to-port="0" /> <edge from-layer="1151" from-port="0" to-layer="1156" to-port="0" /> <edge from-layer="1152" from-port="0" to-layer="1155" to-port="1" /> <edge from-layer="1153" from-port="0" to-layer="1155" to-port="2" /> <edge from-layer="1154" from-port="0" to-layer="1155" to-port="3" /> <edge from-layer="1155" from-port="4" to-layer="1156" to-port="1" /> <edge from-layer="1156" from-port="2" to-layer="1157" to-port="0" /> <edge from-layer="1157" from-port="1" to-layer="1159" to-port="0" /> <edge from-layer="1158" from-port="0" to-layer="1159" to-port="2" /> <edge from-layer="1159" from-port="3" to-layer="1175" to-port="0" /> <edge from-layer="1160" from-port="0" to-layer="1161" to-port="0" /> <edge from-layer="1161" from-port="1" to-layer="1164" to-port="0" /> <edge from-layer="1162" from-port="0" to-layer="1163" to-port="0" /> <edge from-layer="1163" from-port="1" to-layer="1164" to-port="1" /> <edge from-layer="1164" from-port="2" to-layer="1166" to-port="0" /> <edge from-layer="1165" from-port="0" to-layer="1166" to-port="1" /> <edge from-layer="1166" from-port="2" to-layer="1168" to-port="0" /> <edge from-layer="1167" from-port="0" to-layer="1168" to-port="1" /> <edge from-layer="1168" from-port="2" to-layer="1169" to-port="0" /> <edge from-layer="1169" from-port="1" to-layer="1170" to-port="1" /> <edge from-layer="1170" from-port="2" to-layer="1172" to-port="0" /> <edge from-layer="1171" from-port="0" to-layer="1172" to-port="1" /> <edge from-layer="1172" from-port="2" to-layer="1174" to-port="0" /> <edge from-layer="1173" from-port="0" to-layer="1174" to-port="1" /> <edge from-layer="1174" from-port="2" to-layer="1175" to-port="1" /> <edge from-layer="1175" from-port="2" to-layer="1203" to-port="1" /> <edge from-layer="1175" from-port="2" to-layer="4962" to-port="0" /> <edge from-layer="1176" from-port="0" to-layer="1181" to-port="0" /> <edge from-layer="1177" from-port="0" to-layer="1180" to-port="1" /> <edge from-layer="1178" from-port="0" to-layer="1180" to-port="2" /> <edge from-layer="1179" from-port="0" to-layer="1180" to-port="3" /> <edge from-layer="1180" from-port="4" to-layer="1181" to-port="1" /> <edge from-layer="1181" from-port="2" to-layer="1182" to-port="0" /> <edge from-layer="1182" from-port="1" to-layer="1184" to-port="0" /> <edge from-layer="1183" from-port="0" to-layer="1184" to-port="2" /> <edge from-layer="1184" from-port="3" to-layer="1202" to-port="0" /> <edge from-layer="1185" from-port="0" to-layer="1186" to-port="0" /> <edge from-layer="1186" from-port="1" to-layer="1189" to-port="0" /> <edge from-layer="1187" from-port="0" to-layer="1188" to-port="0" /> <edge from-layer="1188" from-port="1" to-layer="1189" to-port="1" /> <edge from-layer="1189" from-port="2" to-layer="1191" to-port="0" /> <edge from-layer="1190" from-port="0" to-layer="1191" to-port="1" /> <edge from-layer="1191" from-port="2" to-layer="1193" to-port="0" /> <edge from-layer="1192" from-port="0" to-layer="1193" to-port="1" /> <edge from-layer="1193" from-port="2" to-layer="1194" to-port="0" /> <edge from-layer="1194" from-port="1" to-layer="1195" to-port="1" /> <edge from-layer="1195" from-port="2" to-layer="1197" to-port="0" /> <edge from-layer="1196" from-port="0" to-layer="1197" to-port="1" /> <edge from-layer="1197" from-port="2" to-layer="1199" to-port="0" /> <edge from-layer="1198" from-port="0" to-layer="1199" to-port="1" /> <edge from-layer="1199" from-port="2" to-layer="1201" to-port="0" /> <edge from-layer="1200" from-port="0" to-layer="1201" to-port="1" /> <edge from-layer="1201" from-port="2" to-layer="1202" to-port="1" /> <edge from-layer="1202" from-port="2" to-layer="1203" to-port="2" /> <edge from-layer="1202" from-port="2" to-layer="4961" to-port="0" /> <edge from-layer="1203" from-port="4" to-layer="1205" to-port="0" /> <edge from-layer="1204" from-port="0" to-layer="1205" to-port="1" /> <edge from-layer="1205" from-port="2" to-layer="1207" to-port="0" /> <edge from-layer="1206" from-port="0" to-layer="1207" to-port="1" /> <edge from-layer="1207" from-port="2" to-layer="1218" to-port="0" /> <edge from-layer="1208" from-port="0" to-layer="1209" to-port="0" /> <edge from-layer="1209" from-port="1" to-layer="1212" to-port="0" /> <edge from-layer="1210" from-port="0" to-layer="1211" to-port="0" /> <edge from-layer="1211" from-port="1" to-layer="1212" to-port="1" /> <edge from-layer="1212" from-port="2" to-layer="1214" to-port="0" /> <edge from-layer="1213" from-port="0" to-layer="1214" to-port="1" /> <edge from-layer="1214" from-port="2" to-layer="1216" to-port="0" /> <edge from-layer="1215" from-port="0" to-layer="1216" to-port="1" /> <edge from-layer="1216" from-port="2" to-layer="1217" to-port="0" /> <edge from-layer="1217" from-port="1" to-layer="1218" to-port="1" /> <edge from-layer="1218" from-port="2" to-layer="1220" to-port="0" /> <edge from-layer="1219" from-port="0" to-layer="1220" to-port="1" /> <edge from-layer="1220" from-port="2" to-layer="1221" to-port="1" /> <edge from-layer="1221" from-port="2" to-layer="1223" to-port="0" /> <edge from-layer="1221" from-port="2" to-layer="1263" to-port="0" /> <edge from-layer="1222" from-port="0" to-layer="1223" to-port="1" /> <edge from-layer="1223" from-port="2" to-layer="1225" to-port="0" /> <edge from-layer="1224" from-port="0" to-layer="1225" to-port="1" /> <edge from-layer="1225" from-port="2" to-layer="1227" to-port="0" /> <edge from-layer="1226" from-port="0" to-layer="1227" to-port="1" /> <edge from-layer="1227" from-port="2" to-layer="1238" to-port="0" /> <edge from-layer="1228" from-port="0" to-layer="1229" to-port="0" /> <edge from-layer="1229" from-port="1" to-layer="1232" to-port="0" /> <edge from-layer="1230" from-port="0" to-layer="1231" to-port="0" /> <edge from-layer="1231" from-port="1" to-layer="1232" to-port="1" /> <edge from-layer="1232" from-port="2" to-layer="1234" to-port="0" /> <edge from-layer="1233" from-port="0" to-layer="1234" to-port="1" /> <edge from-layer="1234" from-port="2" to-layer="1236" to-port="0" /> <edge from-layer="1235" from-port="0" to-layer="1236" to-port="1" /> <edge from-layer="1236" from-port="2" to-layer="1237" to-port="0" /> <edge from-layer="1237" from-port="1" to-layer="1238" to-port="1" /> <edge from-layer="1238" from-port="2" to-layer="1240" to-port="0" /> <edge from-layer="1239" from-port="0" to-layer="1240" to-port="1" /> <edge from-layer="1240" from-port="2" to-layer="1242" to-port="0" /> <edge from-layer="1241" from-port="0" to-layer="1242" to-port="1" /> <edge from-layer="1242" from-port="2" to-layer="1244" to-port="0" /> <edge from-layer="1243" from-port="0" to-layer="1244" to-port="1" /> <edge from-layer="1244" from-port="2" to-layer="1245" to-port="0" /> <edge from-layer="1245" from-port="3" to-layer="1247" to-port="0" /> <edge from-layer="1246" from-port="0" to-layer="1247" to-port="1" /> <edge from-layer="1247" from-port="2" to-layer="1249" to-port="0" /> <edge from-layer="1248" from-port="0" to-layer="1249" to-port="1" /> <edge from-layer="1249" from-port="2" to-layer="1260" to-port="0" /> <edge from-layer="1250" from-port="0" to-layer="1251" to-port="0" /> <edge from-layer="1251" from-port="1" to-layer="1254" to-port="0" /> <edge from-layer="1252" from-port="0" to-layer="1253" to-port="0" /> <edge from-layer="1253" from-port="1" to-layer="1254" to-port="1" /> <edge from-layer="1254" from-port="2" to-layer="1256" to-port="0" /> <edge from-layer="1255" from-port="0" to-layer="1256" to-port="1" /> <edge from-layer="1256" from-port="2" to-layer="1258" to-port="0" /> <edge from-layer="1257" from-port="0" to-layer="1258" to-port="1" /> <edge from-layer="1258" from-port="2" to-layer="1259" to-port="0" /> <edge from-layer="1259" from-port="1" to-layer="1260" to-port="1" /> <edge from-layer="1260" from-port="2" to-layer="1262" to-port="0" /> <edge from-layer="1261" from-port="0" to-layer="1262" to-port="1" /> <edge from-layer="1262" from-port="2" to-layer="1263" to-port="1" /> <edge from-layer="1263" from-port="2" to-layer="1297" to-port="0" /> <edge from-layer="1263" from-port="2" to-layer="1265" to-port="0" /> <edge from-layer="1264" from-port="0" to-layer="1265" to-port="1" /> <edge from-layer="1265" from-port="2" to-layer="1267" to-port="0" /> <edge from-layer="1266" from-port="0" to-layer="1267" to-port="1" /> <edge from-layer="1267" from-port="2" to-layer="1269" to-port="0" /> <edge from-layer="1268" from-port="0" to-layer="1269" to-port="1" /> <edge from-layer="1269" from-port="2" to-layer="1280" to-port="0" /> <edge from-layer="1270" from-port="0" to-layer="1271" to-port="0" /> <edge from-layer="1271" from-port="1" to-layer="1274" to-port="0" /> <edge from-layer="1272" from-port="0" to-layer="1273" to-port="0" /> <edge from-layer="1273" from-port="1" to-layer="1274" to-port="1" /> <edge from-layer="1274" from-port="2" to-layer="1276" to-port="0" /> <edge from-layer="1275" from-port="0" to-layer="1276" to-port="1" /> <edge from-layer="1276" from-port="2" to-layer="1278" to-port="0" /> <edge from-layer="1277" from-port="0" to-layer="1278" to-port="1" /> <edge from-layer="1278" from-port="2" to-layer="1279" to-port="0" /> <edge from-layer="1279" from-port="1" to-layer="1280" to-port="1" /> <edge from-layer="1280" from-port="2" to-layer="1282" to-port="0" /> <edge from-layer="1281" from-port="0" to-layer="1282" to-port="1" /> <edge from-layer="1282" from-port="2" to-layer="1283" to-port="0" /> <edge from-layer="1283" from-port="1" to-layer="1294" to-port="0" /> <edge from-layer="1284" from-port="0" to-layer="1285" to-port="0" /> <edge from-layer="1285" from-port="1" to-layer="1288" to-port="0" /> <edge from-layer="1286" from-port="0" to-layer="1287" to-port="0" /> <edge from-layer="1287" from-port="1" to-layer="1288" to-port="1" /> <edge from-layer="1288" from-port="2" to-layer="1290" to-port="0" /> <edge from-layer="1289" from-port="0" to-layer="1290" to-port="1" /> <edge from-layer="1290" from-port="2" to-layer="1292" to-port="0" /> <edge from-layer="1291" from-port="0" to-layer="1292" to-port="1" /> <edge from-layer="1292" from-port="2" to-layer="1293" to-port="0" /> <edge from-layer="1293" from-port="1" to-layer="1294" to-port="1" /> <edge from-layer="1294" from-port="2" to-layer="1296" to-port="0" /> <edge from-layer="1295" from-port="0" to-layer="1296" to-port="1" /> <edge from-layer="1296" from-port="2" to-layer="1297" to-port="1" /> <edge from-layer="1297" from-port="2" to-layer="1299" to-port="0" /> <edge from-layer="1297" from-port="2" to-layer="1391" to-port="0" /> <edge from-layer="1298" from-port="0" to-layer="1299" to-port="1" /> <edge from-layer="1299" from-port="2" to-layer="1301" to-port="0" /> <edge from-layer="1300" from-port="0" to-layer="1301" to-port="1" /> <edge from-layer="1301" from-port="2" to-layer="1303" to-port="0" /> <edge from-layer="1302" from-port="0" to-layer="1303" to-port="1" /> <edge from-layer="1303" from-port="2" to-layer="1314" to-port="0" /> <edge from-layer="1303" from-port="2" to-layer="1340" to-port="0" /> <edge from-layer="1303" from-port="2" to-layer="1365" to-port="0" /> <edge from-layer="1304" from-port="0" to-layer="1305" to-port="0" /> <edge from-layer="1305" from-port="1" to-layer="1308" to-port="0" /> <edge from-layer="1306" from-port="0" to-layer="1307" to-port="0" /> <edge from-layer="1307" from-port="1" to-layer="1308" to-port="1" /> <edge from-layer="1308" from-port="2" to-layer="1310" to-port="0" /> <edge from-layer="1309" from-port="0" to-layer="1310" to-port="1" /> <edge from-layer="1310" from-port="2" to-layer="1312" to-port="0" /> <edge from-layer="1311" from-port="0" to-layer="1312" to-port="1" /> <edge from-layer="1312" from-port="2" to-layer="1313" to-port="0" /> <edge from-layer="1313" from-port="1" to-layer="1314" to-port="1" /> <edge from-layer="1314" from-port="2" to-layer="1316" to-port="0" /> <edge from-layer="1315" from-port="0" to-layer="1316" to-port="1" /> <edge from-layer="1316" from-port="2" to-layer="1318" to-port="0" /> <edge from-layer="1317" from-port="0" to-layer="1318" to-port="1" /> <edge from-layer="1318" from-port="2" to-layer="1320" to-port="0" /> <edge from-layer="1319" from-port="0" to-layer="1320" to-port="1" /> <edge from-layer="1320" from-port="2" to-layer="1373" to-port="0" /> <edge from-layer="1321" from-port="0" to-layer="1326" to-port="0" /> <edge from-layer="1322" from-port="0" to-layer="1325" to-port="1" /> <edge from-layer="1323" from-port="0" to-layer="1325" to-port="2" /> <edge from-layer="1324" from-port="0" to-layer="1325" to-port="3" /> <edge from-layer="1325" from-port="4" to-layer="1326" to-port="1" /> <edge from-layer="1326" from-port="2" to-layer="1327" to-port="0" /> <edge from-layer="1327" from-port="1" to-layer="1329" to-port="0" /> <edge from-layer="1328" from-port="0" to-layer="1329" to-port="2" /> <edge from-layer="1329" from-port="3" to-layer="1345" to-port="0" /> <edge from-layer="1330" from-port="0" to-layer="1331" to-port="0" /> <edge from-layer="1331" from-port="1" to-layer="1334" to-port="0" /> <edge from-layer="1332" from-port="0" to-layer="1333" to-port="0" /> <edge from-layer="1333" from-port="1" to-layer="1334" to-port="1" /> <edge from-layer="1334" from-port="2" to-layer="1336" to-port="0" /> <edge from-layer="1335" from-port="0" to-layer="1336" to-port="1" /> <edge from-layer="1336" from-port="2" to-layer="1338" to-port="0" /> <edge from-layer="1337" from-port="0" to-layer="1338" to-port="1" /> <edge from-layer="1338" from-port="2" to-layer="1339" to-port="0" /> <edge from-layer="1339" from-port="1" to-layer="1340" to-port="1" /> <edge from-layer="1340" from-port="2" to-layer="1342" to-port="0" /> <edge from-layer="1341" from-port="0" to-layer="1342" to-port="1" /> <edge from-layer="1342" from-port="2" to-layer="1344" to-port="0" /> <edge from-layer="1343" from-port="0" to-layer="1344" to-port="1" /> <edge from-layer="1344" from-port="2" to-layer="1345" to-port="1" /> <edge from-layer="1345" from-port="2" to-layer="1373" to-port="1" /> <edge from-layer="1345" from-port="2" to-layer="4940" to-port="0" /> <edge from-layer="1346" from-port="0" to-layer="1351" to-port="0" /> <edge from-layer="1347" from-port="0" to-layer="1350" to-port="1" /> <edge from-layer="1348" from-port="0" to-layer="1350" to-port="2" /> <edge from-layer="1349" from-port="0" to-layer="1350" to-port="3" /> <edge from-layer="1350" from-port="4" to-layer="1351" to-port="1" /> <edge from-layer="1351" from-port="2" to-layer="1352" to-port="0" /> <edge from-layer="1352" from-port="1" to-layer="1354" to-port="0" /> <edge from-layer="1353" from-port="0" to-layer="1354" to-port="2" /> <edge from-layer="1354" from-port="3" to-layer="1372" to-port="0" /> <edge from-layer="1355" from-port="0" to-layer="1356" to-port="0" /> <edge from-layer="1356" from-port="1" to-layer="1359" to-port="0" /> <edge from-layer="1357" from-port="0" to-layer="1358" to-port="0" /> <edge from-layer="1358" from-port="1" to-layer="1359" to-port="1" /> <edge from-layer="1359" from-port="2" to-layer="1361" to-port="0" /> <edge from-layer="1360" from-port="0" to-layer="1361" to-port="1" /> <edge from-layer="1361" from-port="2" to-layer="1363" to-port="0" /> <edge from-layer="1362" from-port="0" to-layer="1363" to-port="1" /> <edge from-layer="1363" from-port="2" to-layer="1364" to-port="0" /> <edge from-layer="1364" from-port="1" to-layer="1365" to-port="1" /> <edge from-layer="1365" from-port="2" to-layer="1367" to-port="0" /> <edge from-layer="1366" from-port="0" to-layer="1367" to-port="1" /> <edge from-layer="1367" from-port="2" to-layer="1369" to-port="0" /> <edge from-layer="1368" from-port="0" to-layer="1369" to-port="1" /> <edge from-layer="1369" from-port="2" to-layer="1371" to-port="0" /> <edge from-layer="1370" from-port="0" to-layer="1371" to-port="1" /> <edge from-layer="1371" from-port="2" to-layer="1372" to-port="1" /> <edge from-layer="1372" from-port="2" to-layer="4939" to-port="0" /> <edge from-layer="1372" from-port="2" to-layer="1373" to-port="2" /> <edge from-layer="1373" from-port="4" to-layer="1375" to-port="0" /> <edge from-layer="1374" from-port="0" to-layer="1375" to-port="1" /> <edge from-layer="1375" from-port="2" to-layer="1377" to-port="0" /> <edge from-layer="1376" from-port="0" to-layer="1377" to-port="1" /> <edge from-layer="1377" from-port="2" to-layer="1388" to-port="0" /> <edge from-layer="1378" from-port="0" to-layer="1379" to-port="0" /> <edge from-layer="1379" from-port="1" to-layer="1382" to-port="0" /> <edge from-layer="1380" from-port="0" to-layer="1381" to-port="0" /> <edge from-layer="1381" from-port="1" to-layer="1382" to-port="1" /> <edge from-layer="1382" from-port="2" to-layer="1384" to-port="0" /> <edge from-layer="1383" from-port="0" to-layer="1384" to-port="1" /> <edge from-layer="1384" from-port="2" to-layer="1386" to-port="0" /> <edge from-layer="1385" from-port="0" to-layer="1386" to-port="1" /> <edge from-layer="1386" from-port="2" to-layer="1387" to-port="0" /> <edge from-layer="1387" from-port="1" to-layer="1388" to-port="1" /> <edge from-layer="1388" from-port="2" to-layer="1390" to-port="0" /> <edge from-layer="1389" from-port="0" to-layer="1390" to-port="1" /> <edge from-layer="1390" from-port="2" to-layer="1391" to-port="1" /> <edge from-layer="1391" from-port="2" to-layer="1393" to-port="0" /> <edge from-layer="1391" from-port="2" to-layer="1433" to-port="0" /> <edge from-layer="1392" from-port="0" to-layer="1393" to-port="1" /> <edge from-layer="1393" from-port="2" to-layer="1395" to-port="0" /> <edge from-layer="1394" from-port="0" to-layer="1395" to-port="1" /> <edge from-layer="1395" from-port="2" to-layer="1397" to-port="0" /> <edge from-layer="1396" from-port="0" to-layer="1397" to-port="1" /> <edge from-layer="1397" from-port="2" to-layer="1408" to-port="0" /> <edge from-layer="1398" from-port="0" to-layer="1399" to-port="0" /> <edge from-layer="1399" from-port="1" to-layer="1402" to-port="0" /> <edge from-layer="1400" from-port="0" to-layer="1401" to-port="0" /> <edge from-layer="1401" from-port="1" to-layer="1402" to-port="1" /> <edge from-layer="1402" from-port="2" to-layer="1404" to-port="0" /> <edge from-layer="1403" from-port="0" to-layer="1404" to-port="1" /> <edge from-layer="1404" from-port="2" to-layer="1406" to-port="0" /> <edge from-layer="1405" from-port="0" to-layer="1406" to-port="1" /> <edge from-layer="1406" from-port="2" to-layer="1407" to-port="0" /> <edge from-layer="1407" from-port="1" to-layer="1408" to-port="1" /> <edge from-layer="1408" from-port="2" to-layer="1410" to-port="0" /> <edge from-layer="1409" from-port="0" to-layer="1410" to-port="1" /> <edge from-layer="1410" from-port="2" to-layer="1412" to-port="0" /> <edge from-layer="1411" from-port="0" to-layer="1412" to-port="1" /> <edge from-layer="1412" from-port="2" to-layer="1414" to-port="0" /> <edge from-layer="1413" from-port="0" to-layer="1414" to-port="1" /> <edge from-layer="1414" from-port="2" to-layer="1415" to-port="0" /> <edge from-layer="1415" from-port="3" to-layer="1417" to-port="0" /> <edge from-layer="1416" from-port="0" to-layer="1417" to-port="1" /> <edge from-layer="1417" from-port="2" to-layer="1419" to-port="0" /> <edge from-layer="1418" from-port="0" to-layer="1419" to-port="1" /> <edge from-layer="1419" from-port="2" to-layer="1430" to-port="0" /> <edge from-layer="1420" from-port="0" to-layer="1421" to-port="0" /> <edge from-layer="1421" from-port="1" to-layer="1424" to-port="0" /> <edge from-layer="1422" from-port="0" to-layer="1423" to-port="0" /> <edge from-layer="1423" from-port="1" to-layer="1424" to-port="1" /> <edge from-layer="1424" from-port="2" to-layer="1426" to-port="0" /> <edge from-layer="1425" from-port="0" to-layer="1426" to-port="1" /> <edge from-layer="1426" from-port="2" to-layer="1428" to-port="0" /> <edge from-layer="1427" from-port="0" to-layer="1428" to-port="1" /> <edge from-layer="1428" from-port="2" to-layer="1429" to-port="0" /> <edge from-layer="1429" from-port="1" to-layer="1430" to-port="1" /> <edge from-layer="1430" from-port="2" to-layer="1432" to-port="0" /> <edge from-layer="1431" from-port="0" to-layer="1432" to-port="1" /> <edge from-layer="1432" from-port="2" to-layer="1433" to-port="1" /> <edge from-layer="1433" from-port="2" to-layer="1435" to-port="0" /> <edge from-layer="1433" from-port="2" to-layer="1467" to-port="0" /> <edge from-layer="1434" from-port="0" to-layer="1435" to-port="1" /> <edge from-layer="1435" from-port="2" to-layer="1437" to-port="0" /> <edge from-layer="1436" from-port="0" to-layer="1437" to-port="1" /> <edge from-layer="1437" from-port="2" to-layer="1439" to-port="0" /> <edge from-layer="1438" from-port="0" to-layer="1439" to-port="1" /> <edge from-layer="1439" from-port="2" to-layer="1450" to-port="0" /> <edge from-layer="1440" from-port="0" to-layer="1441" to-port="0" /> <edge from-layer="1441" from-port="1" to-layer="1444" to-port="0" /> <edge from-layer="1442" from-port="0" to-layer="1443" to-port="0" /> <edge from-layer="1443" from-port="1" to-layer="1444" to-port="1" /> <edge from-layer="1444" from-port="2" to-layer="1446" to-port="0" /> <edge from-layer="1445" from-port="0" to-layer="1446" to-port="1" /> <edge from-layer="1446" from-port="2" to-layer="1448" to-port="0" /> <edge from-layer="1447" from-port="0" to-layer="1448" to-port="1" /> <edge from-layer="1448" from-port="2" to-layer="1449" to-port="0" /> <edge from-layer="1449" from-port="1" to-layer="1450" to-port="1" /> <edge from-layer="1450" from-port="2" to-layer="1452" to-port="0" /> <edge from-layer="1451" from-port="0" to-layer="1452" to-port="1" /> <edge from-layer="1452" from-port="2" to-layer="1453" to-port="0" /> <edge from-layer="1453" from-port="1" to-layer="1464" to-port="0" /> <edge from-layer="1454" from-port="0" to-layer="1455" to-port="0" /> <edge from-layer="1455" from-port="1" to-layer="1458" to-port="0" /> <edge from-layer="1456" from-port="0" to-layer="1457" to-port="0" /> <edge from-layer="1457" from-port="1" to-layer="1458" to-port="1" /> <edge from-layer="1458" from-port="2" to-layer="1460" to-port="0" /> <edge from-layer="1459" from-port="0" to-layer="1460" to-port="1" /> <edge from-layer="1460" from-port="2" to-layer="1462" to-port="0" /> <edge from-layer="1461" from-port="0" to-layer="1462" to-port="1" /> <edge from-layer="1462" from-port="2" to-layer="1463" to-port="0" /> <edge from-layer="1463" from-port="1" to-layer="1464" to-port="1" /> <edge from-layer="1464" from-port="2" to-layer="1466" to-port="0" /> <edge from-layer="1465" from-port="0" to-layer="1466" to-port="1" /> <edge from-layer="1466" from-port="2" to-layer="1467" to-port="1" /> <edge from-layer="1467" from-port="2" to-layer="1469" to-port="0" /> <edge from-layer="1467" from-port="2" to-layer="1561" to-port="0" /> <edge from-layer="1468" from-port="0" to-layer="1469" to-port="1" /> <edge from-layer="1469" from-port="2" to-layer="1471" to-port="0" /> <edge from-layer="1470" from-port="0" to-layer="1471" to-port="1" /> <edge from-layer="1471" from-port="2" to-layer="1473" to-port="0" /> <edge from-layer="1472" from-port="0" to-layer="1473" to-port="1" /> <edge from-layer="1473" from-port="2" to-layer="1535" to-port="0" /> <edge from-layer="1473" from-port="2" to-layer="1510" to-port="0" /> <edge from-layer="1473" from-port="2" to-layer="1484" to-port="0" /> <edge from-layer="1474" from-port="0" to-layer="1475" to-port="0" /> <edge from-layer="1475" from-port="1" to-layer="1478" to-port="0" /> <edge from-layer="1476" from-port="0" to-layer="1477" to-port="0" /> <edge from-layer="1477" from-port="1" to-layer="1478" to-port="1" /> <edge from-layer="1478" from-port="2" to-layer="1480" to-port="0" /> <edge from-layer="1479" from-port="0" to-layer="1480" to-port="1" /> <edge from-layer="1480" from-port="2" to-layer="1482" to-port="0" /> <edge from-layer="1481" from-port="0" to-layer="1482" to-port="1" /> <edge from-layer="1482" from-port="2" to-layer="1483" to-port="0" /> <edge from-layer="1483" from-port="1" to-layer="1484" to-port="1" /> <edge from-layer="1484" from-port="2" to-layer="1486" to-port="0" /> <edge from-layer="1485" from-port="0" to-layer="1486" to-port="1" /> <edge from-layer="1486" from-port="2" to-layer="1488" to-port="0" /> <edge from-layer="1487" from-port="0" to-layer="1488" to-port="1" /> <edge from-layer="1488" from-port="2" to-layer="1490" to-port="0" /> <edge from-layer="1489" from-port="0" to-layer="1490" to-port="1" /> <edge from-layer="1490" from-port="2" to-layer="1543" to-port="0" /> <edge from-layer="1491" from-port="0" to-layer="1496" to-port="0" /> <edge from-layer="1492" from-port="0" to-layer="1495" to-port="1" /> <edge from-layer="1493" from-port="0" to-layer="1495" to-port="2" /> <edge from-layer="1494" from-port="0" to-layer="1495" to-port="3" /> <edge from-layer="1495" from-port="4" to-layer="1496" to-port="1" /> <edge from-layer="1496" from-port="2" to-layer="1497" to-port="0" /> <edge from-layer="1497" from-port="1" to-layer="1499" to-port="0" /> <edge from-layer="1498" from-port="0" to-layer="1499" to-port="2" /> <edge from-layer="1499" from-port="3" to-layer="1515" to-port="0" /> <edge from-layer="1500" from-port="0" to-layer="1501" to-port="0" /> <edge from-layer="1501" from-port="1" to-layer="1504" to-port="0" /> <edge from-layer="1502" from-port="0" to-layer="1503" to-port="0" /> <edge from-layer="1503" from-port="1" to-layer="1504" to-port="1" /> <edge from-layer="1504" from-port="2" to-layer="1506" to-port="0" /> <edge from-layer="1505" from-port="0" to-layer="1506" to-port="1" /> <edge from-layer="1506" from-port="2" to-layer="1508" to-port="0" /> <edge from-layer="1507" from-port="0" to-layer="1508" to-port="1" /> <edge from-layer="1508" from-port="2" to-layer="1509" to-port="0" /> <edge from-layer="1509" from-port="1" to-layer="1510" to-port="1" /> <edge from-layer="1510" from-port="2" to-layer="1512" to-port="0" /> <edge from-layer="1511" from-port="0" to-layer="1512" to-port="1" /> <edge from-layer="1512" from-port="2" to-layer="1514" to-port="0" /> <edge from-layer="1513" from-port="0" to-layer="1514" to-port="1" /> <edge from-layer="1514" from-port="2" to-layer="1515" to-port="1" /> <edge from-layer="1515" from-port="2" to-layer="1543" to-port="1" /> <edge from-layer="1515" from-port="2" to-layer="2550" to-port="0" /> <edge from-layer="1516" from-port="0" to-layer="1521" to-port="0" /> <edge from-layer="1517" from-port="0" to-layer="1520" to-port="1" /> <edge from-layer="1518" from-port="0" to-layer="1520" to-port="2" /> <edge from-layer="1519" from-port="0" to-layer="1520" to-port="3" /> <edge from-layer="1520" from-port="4" to-layer="1521" to-port="1" /> <edge from-layer="1521" from-port="2" to-layer="1522" to-port="0" /> <edge from-layer="1522" from-port="1" to-layer="1524" to-port="0" /> <edge from-layer="1523" from-port="0" to-layer="1524" to-port="2" /> <edge from-layer="1524" from-port="3" to-layer="1542" to-port="0" /> <edge from-layer="1525" from-port="0" to-layer="1526" to-port="0" /> <edge from-layer="1526" from-port="1" to-layer="1529" to-port="0" /> <edge from-layer="1527" from-port="0" to-layer="1528" to-port="0" /> <edge from-layer="1528" from-port="1" to-layer="1529" to-port="1" /> <edge from-layer="1529" from-port="2" to-layer="1531" to-port="0" /> <edge from-layer="1530" from-port="0" to-layer="1531" to-port="1" /> <edge from-layer="1531" from-port="2" to-layer="1533" to-port="0" /> <edge from-layer="1532" from-port="0" to-layer="1533" to-port="1" /> <edge from-layer="1533" from-port="2" to-layer="1534" to-port="0" /> <edge from-layer="1534" from-port="1" to-layer="1535" to-port="1" /> <edge from-layer="1535" from-port="2" to-layer="1537" to-port="0" /> <edge from-layer="1536" from-port="0" to-layer="1537" to-port="1" /> <edge from-layer="1537" from-port="2" to-layer="1539" to-port="0" /> <edge from-layer="1538" from-port="0" to-layer="1539" to-port="1" /> <edge from-layer="1539" from-port="2" to-layer="1541" to-port="0" /> <edge from-layer="1540" from-port="0" to-layer="1541" to-port="1" /> <edge from-layer="1541" from-port="2" to-layer="1542" to-port="1" /> <edge from-layer="1542" from-port="2" to-layer="2549" to-port="0" /> <edge from-layer="1542" from-port="2" to-layer="1543" to-port="2" /> <edge from-layer="1543" from-port="4" to-layer="1545" to-port="0" /> <edge from-layer="1544" from-port="0" to-layer="1545" to-port="1" /> <edge from-layer="1545" from-port="2" to-layer="1547" to-port="0" /> <edge from-layer="1546" from-port="0" to-layer="1547" to-port="1" /> <edge from-layer="1547" from-port="2" to-layer="1558" to-port="0" /> <edge from-layer="1548" from-port="0" to-layer="1549" to-port="0" /> <edge from-layer="1549" from-port="1" to-layer="1552" to-port="0" /> <edge from-layer="1550" from-port="0" to-layer="1551" to-port="0" /> <edge from-layer="1551" from-port="1" to-layer="1552" to-port="1" /> <edge from-layer="1552" from-port="2" to-layer="1554" to-port="0" /> <edge from-layer="1553" from-port="0" to-layer="1554" to-port="1" /> <edge from-layer="1554" from-port="2" to-layer="1556" to-port="0" /> <edge from-layer="1555" from-port="0" to-layer="1556" to-port="1" /> <edge from-layer="1556" from-port="2" to-layer="1557" to-port="0" /> <edge from-layer="1557" from-port="1" to-layer="1558" to-port="1" /> <edge from-layer="1558" from-port="2" to-layer="1560" to-port="0" /> <edge from-layer="1559" from-port="0" to-layer="1560" to-port="1" /> <edge from-layer="1560" from-port="2" to-layer="1561" to-port="1" /> <edge from-layer="1561" from-port="2" to-layer="1603" to-port="0" /> <edge from-layer="1561" from-port="2" to-layer="1563" to-port="0" /> <edge from-layer="1562" from-port="0" to-layer="1563" to-port="1" /> <edge from-layer="1563" from-port="2" to-layer="1565" to-port="0" /> <edge from-layer="1564" from-port="0" to-layer="1565" to-port="1" /> <edge from-layer="1565" from-port="2" to-layer="1567" to-port="0" /> <edge from-layer="1566" from-port="0" to-layer="1567" to-port="1" /> <edge from-layer="1567" from-port="2" to-layer="1578" to-port="0" /> <edge from-layer="1568" from-port="0" to-layer="1569" to-port="0" /> <edge from-layer="1569" from-port="1" to-layer="1572" to-port="0" /> <edge from-layer="1570" from-port="0" to-layer="1571" to-port="0" /> <edge from-layer="1571" from-port="1" to-layer="1572" to-port="1" /> <edge from-layer="1572" from-port="2" to-layer="1574" to-port="0" /> <edge from-layer="1573" from-port="0" to-layer="1574" to-port="1" /> <edge from-layer="1574" from-port="2" to-layer="1576" to-port="0" /> <edge from-layer="1575" from-port="0" to-layer="1576" to-port="1" /> <edge from-layer="1576" from-port="2" to-layer="1577" to-port="0" /> <edge from-layer="1577" from-port="1" to-layer="1578" to-port="1" /> <edge from-layer="1578" from-port="2" to-layer="1580" to-port="0" /> <edge from-layer="1579" from-port="0" to-layer="1580" to-port="1" /> <edge from-layer="1580" from-port="2" to-layer="1582" to-port="0" /> <edge from-layer="1581" from-port="0" to-layer="1582" to-port="1" /> <edge from-layer="1582" from-port="2" to-layer="1584" to-port="0" /> <edge from-layer="1583" from-port="0" to-layer="1584" to-port="1" /> <edge from-layer="1584" from-port="2" to-layer="1585" to-port="0" /> <edge from-layer="1585" from-port="3" to-layer="1587" to-port="0" /> <edge from-layer="1586" from-port="0" to-layer="1587" to-port="1" /> <edge from-layer="1587" from-port="2" to-layer="1589" to-port="0" /> <edge from-layer="1588" from-port="0" to-layer="1589" to-port="1" /> <edge from-layer="1589" from-port="2" to-layer="1600" to-port="0" /> <edge from-layer="1590" from-port="0" to-layer="1591" to-port="0" /> <edge from-layer="1591" from-port="1" to-layer="1594" to-port="0" /> <edge from-layer="1592" from-port="0" to-layer="1593" to-port="0" /> <edge from-layer="1593" from-port="1" to-layer="1594" to-port="1" /> <edge from-layer="1594" from-port="2" to-layer="1596" to-port="0" /> <edge from-layer="1595" from-port="0" to-layer="1596" to-port="1" /> <edge from-layer="1596" from-port="2" to-layer="1598" to-port="0" /> <edge from-layer="1597" from-port="0" to-layer="1598" to-port="1" /> <edge from-layer="1598" from-port="2" to-layer="1599" to-port="0" /> <edge from-layer="1599" from-port="1" to-layer="1600" to-port="1" /> <edge from-layer="1600" from-port="2" to-layer="1602" to-port="0" /> <edge from-layer="1601" from-port="0" to-layer="1602" to-port="1" /> <edge from-layer="1602" from-port="2" to-layer="1603" to-port="1" /> <edge from-layer="1603" from-port="2" to-layer="1605" to-port="0" /> <edge from-layer="1603" from-port="2" to-layer="1637" to-port="0" /> <edge from-layer="1604" from-port="0" to-layer="1605" to-port="1" /> <edge from-layer="1605" from-port="2" to-layer="1607" to-port="0" /> <edge from-layer="1606" from-port="0" to-layer="1607" to-port="1" /> <edge from-layer="1607" from-port="2" to-layer="1609" to-port="0" /> <edge from-layer="1608" from-port="0" to-layer="1609" to-port="1" /> <edge from-layer="1609" from-port="2" to-layer="1620" to-port="0" /> <edge from-layer="1610" from-port="0" to-layer="1611" to-port="0" /> <edge from-layer="1611" from-port="1" to-layer="1614" to-port="0" /> <edge from-layer="1612" from-port="0" to-layer="1613" to-port="0" /> <edge from-layer="1613" from-port="1" to-layer="1614" to-port="1" /> <edge from-layer="1614" from-port="2" to-layer="1616" to-port="0" /> <edge from-layer="1615" from-port="0" to-layer="1616" to-port="1" /> <edge from-layer="1616" from-port="2" to-layer="1618" to-port="0" /> <edge from-layer="1617" from-port="0" to-layer="1618" to-port="1" /> <edge from-layer="1618" from-port="2" to-layer="1619" to-port="0" /> <edge from-layer="1619" from-port="1" to-layer="1620" to-port="1" /> <edge from-layer="1620" from-port="2" to-layer="1622" to-port="0" /> <edge from-layer="1621" from-port="0" to-layer="1622" to-port="1" /> <edge from-layer="1622" from-port="2" to-layer="1623" to-port="0" /> <edge from-layer="1623" from-port="1" to-layer="1634" to-port="0" /> <edge from-layer="1624" from-port="0" to-layer="1625" to-port="0" /> <edge from-layer="1625" from-port="1" to-layer="1628" to-port="0" /> <edge from-layer="1626" from-port="0" to-layer="1627" to-port="0" /> <edge from-layer="1627" from-port="1" to-layer="1628" to-port="1" /> <edge from-layer="1628" from-port="2" to-layer="1630" to-port="0" /> <edge from-layer="1629" from-port="0" to-layer="1630" to-port="1" /> <edge from-layer="1630" from-port="2" to-layer="1632" to-port="0" /> <edge from-layer="1631" from-port="0" to-layer="1632" to-port="1" /> <edge from-layer="1632" from-port="2" to-layer="1633" to-port="0" /> <edge from-layer="1633" from-port="1" to-layer="1634" to-port="1" /> <edge from-layer="1634" from-port="2" to-layer="1636" to-port="0" /> <edge from-layer="1635" from-port="0" to-layer="1636" to-port="1" /> <edge from-layer="1636" from-port="2" to-layer="1637" to-port="1" /> <edge from-layer="1637" from-port="2" to-layer="1731" to-port="0" /> <edge from-layer="1637" from-port="2" to-layer="1639" to-port="0" /> <edge from-layer="1638" from-port="0" to-layer="1639" to-port="1" /> <edge from-layer="1639" from-port="2" to-layer="1641" to-port="0" /> <edge from-layer="1640" from-port="0" to-layer="1641" to-port="1" /> <edge from-layer="1641" from-port="2" to-layer="1643" to-port="0" /> <edge from-layer="1642" from-port="0" to-layer="1643" to-port="1" /> <edge from-layer="1643" from-port="2" to-layer="1705" to-port="0" /> <edge from-layer="1643" from-port="2" to-layer="1680" to-port="0" /> <edge from-layer="1643" from-port="2" to-layer="1654" to-port="0" /> <edge from-layer="1644" from-port="0" to-layer="1645" to-port="0" /> <edge from-layer="1645" from-port="1" to-layer="1648" to-port="0" /> <edge from-layer="1646" from-port="0" to-layer="1647" to-port="0" /> <edge from-layer="1647" from-port="1" to-layer="1648" to-port="1" /> <edge from-layer="1648" from-port="2" to-layer="1650" to-port="0" /> <edge from-layer="1649" from-port="0" to-layer="1650" to-port="1" /> <edge from-layer="1650" from-port="2" to-layer="1652" to-port="0" /> <edge from-layer="1651" from-port="0" to-layer="1652" to-port="1" /> <edge from-layer="1652" from-port="2" to-layer="1653" to-port="0" /> <edge from-layer="1653" from-port="1" to-layer="1654" to-port="1" /> <edge from-layer="1654" from-port="2" to-layer="1656" to-port="0" /> <edge from-layer="1655" from-port="0" to-layer="1656" to-port="1" /> <edge from-layer="1656" from-port="2" to-layer="1658" to-port="0" /> <edge from-layer="1657" from-port="0" to-layer="1658" to-port="1" /> <edge from-layer="1658" from-port="2" to-layer="1660" to-port="0" /> <edge from-layer="1659" from-port="0" to-layer="1660" to-port="1" /> <edge from-layer="1660" from-port="2" to-layer="1713" to-port="0" /> <edge from-layer="1661" from-port="0" to-layer="1666" to-port="0" /> <edge from-layer="1662" from-port="0" to-layer="1665" to-port="1" /> <edge from-layer="1663" from-port="0" to-layer="1665" to-port="2" /> <edge from-layer="1664" from-port="0" to-layer="1665" to-port="3" /> <edge from-layer="1665" from-port="4" to-layer="1666" to-port="1" /> <edge from-layer="1666" from-port="2" to-layer="1667" to-port="0" /> <edge from-layer="1667" from-port="1" to-layer="1669" to-port="0" /> <edge from-layer="1668" from-port="0" to-layer="1669" to-port="2" /> <edge from-layer="1669" from-port="3" to-layer="1685" to-port="0" /> <edge from-layer="1670" from-port="0" to-layer="1671" to-port="0" /> <edge from-layer="1671" from-port="1" to-layer="1674" to-port="0" /> <edge from-layer="1672" from-port="0" to-layer="1673" to-port="0" /> <edge from-layer="1673" from-port="1" to-layer="1674" to-port="1" /> <edge from-layer="1674" from-port="2" to-layer="1676" to-port="0" /> <edge from-layer="1675" from-port="0" to-layer="1676" to-port="1" /> <edge from-layer="1676" from-port="2" to-layer="1678" to-port="0" /> <edge from-layer="1677" from-port="0" to-layer="1678" to-port="1" /> <edge from-layer="1678" from-port="2" to-layer="1679" to-port="0" /> <edge from-layer="1679" from-port="1" to-layer="1680" to-port="1" /> <edge from-layer="1680" from-port="2" to-layer="1682" to-port="0" /> <edge from-layer="1681" from-port="0" to-layer="1682" to-port="1" /> <edge from-layer="1682" from-port="2" to-layer="1684" to-port="0" /> <edge from-layer="1683" from-port="0" to-layer="1684" to-port="1" /> <edge from-layer="1684" from-port="2" to-layer="1685" to-port="1" /> <edge from-layer="1685" from-port="2" to-layer="1713" to-port="1" /> <edge from-layer="1685" from-port="2" to-layer="2548" to-port="0" /> <edge from-layer="1686" from-port="0" to-layer="1691" to-port="0" /> <edge from-layer="1687" from-port="0" to-layer="1690" to-port="1" /> <edge from-layer="1688" from-port="0" to-layer="1690" to-port="2" /> <edge from-layer="1689" from-port="0" to-layer="1690" to-port="3" /> <edge from-layer="1690" from-port="4" to-layer="1691" to-port="1" /> <edge from-layer="1691" from-port="2" to-layer="1692" to-port="0" /> <edge from-layer="1692" from-port="1" to-layer="1694" to-port="0" /> <edge from-layer="1693" from-port="0" to-layer="1694" to-port="2" /> <edge from-layer="1694" from-port="3" to-layer="1712" to-port="0" /> <edge from-layer="1695" from-port="0" to-layer="1696" to-port="0" /> <edge from-layer="1696" from-port="1" to-layer="1699" to-port="0" /> <edge from-layer="1697" from-port="0" to-layer="1698" to-port="0" /> <edge from-layer="1698" from-port="1" to-layer="1699" to-port="1" /> <edge from-layer="1699" from-port="2" to-layer="1701" to-port="0" /> <edge from-layer="1700" from-port="0" to-layer="1701" to-port="1" /> <edge from-layer="1701" from-port="2" to-layer="1703" to-port="0" /> <edge from-layer="1702" from-port="0" to-layer="1703" to-port="1" /> <edge from-layer="1703" from-port="2" to-layer="1704" to-port="0" /> <edge from-layer="1704" from-port="1" to-layer="1705" to-port="1" /> <edge from-layer="1705" from-port="2" to-layer="1707" to-port="0" /> <edge from-layer="1706" from-port="0" to-layer="1707" to-port="1" /> <edge from-layer="1707" from-port="2" to-layer="1709" to-port="0" /> <edge from-layer="1708" from-port="0" to-layer="1709" to-port="1" /> <edge from-layer="1709" from-port="2" to-layer="1711" to-port="0" /> <edge from-layer="1710" from-port="0" to-layer="1711" to-port="1" /> <edge from-layer="1711" from-port="2" to-layer="1712" to-port="1" /> <edge from-layer="1712" from-port="2" to-layer="2547" to-port="0" /> <edge from-layer="1712" from-port="2" to-layer="1713" to-port="2" /> <edge from-layer="1713" from-port="4" to-layer="1715" to-port="0" /> <edge from-layer="1714" from-port="0" to-layer="1715" to-port="1" /> <edge from-layer="1715" from-port="2" to-layer="1717" to-port="0" /> <edge from-layer="1716" from-port="0" to-layer="1717" to-port="1" /> <edge from-layer="1717" from-port="2" to-layer="1728" to-port="0" /> <edge from-layer="1718" from-port="0" to-layer="1719" to-port="0" /> <edge from-layer="1719" from-port="1" to-layer="1722" to-port="0" /> <edge from-layer="1720" from-port="0" to-layer="1721" to-port="0" /> <edge from-layer="1721" from-port="1" to-layer="1722" to-port="1" /> <edge from-layer="1722" from-port="2" to-layer="1724" to-port="0" /> <edge from-layer="1723" from-port="0" to-layer="1724" to-port="1" /> <edge from-layer="1724" from-port="2" to-layer="1726" to-port="0" /> <edge from-layer="1725" from-port="0" to-layer="1726" to-port="1" /> <edge from-layer="1726" from-port="2" to-layer="1727" to-port="0" /> <edge from-layer="1727" from-port="1" to-layer="1728" to-port="1" /> <edge from-layer="1728" from-port="2" to-layer="1730" to-port="0" /> <edge from-layer="1729" from-port="0" to-layer="1730" to-port="1" /> <edge from-layer="1730" from-port="2" to-layer="1731" to-port="1" /> <edge from-layer="1731" from-port="2" to-layer="1733" to-port="0" /> <edge from-layer="1731" from-port="2" to-layer="1773" to-port="0" /> <edge from-layer="1732" from-port="0" to-layer="1733" to-port="1" /> <edge from-layer="1733" from-port="2" to-layer="1735" to-port="0" /> <edge from-layer="1734" from-port="0" to-layer="1735" to-port="1" /> <edge from-layer="1735" from-port="2" to-layer="1737" to-port="0" /> <edge from-layer="1736" from-port="0" to-layer="1737" to-port="1" /> <edge from-layer="1737" from-port="2" to-layer="1748" to-port="0" /> <edge from-layer="1738" from-port="0" to-layer="1739" to-port="0" /> <edge from-layer="1739" from-port="1" to-layer="1742" to-port="0" /> <edge from-layer="1740" from-port="0" to-layer="1741" to-port="0" /> <edge from-layer="1741" from-port="1" to-layer="1742" to-port="1" /> <edge from-layer="1742" from-port="2" to-layer="1744" to-port="0" /> <edge from-layer="1743" from-port="0" to-layer="1744" to-port="1" /> <edge from-layer="1744" from-port="2" to-layer="1746" to-port="0" /> <edge from-layer="1745" from-port="0" to-layer="1746" to-port="1" /> <edge from-layer="1746" from-port="2" to-layer="1747" to-port="0" /> <edge from-layer="1747" from-port="1" to-layer="1748" to-port="1" /> <edge from-layer="1748" from-port="2" to-layer="1750" to-port="0" /> <edge from-layer="1749" from-port="0" to-layer="1750" to-port="1" /> <edge from-layer="1750" from-port="2" to-layer="1752" to-port="0" /> <edge from-layer="1751" from-port="0" to-layer="1752" to-port="1" /> <edge from-layer="1752" from-port="2" to-layer="1754" to-port="0" /> <edge from-layer="1753" from-port="0" to-layer="1754" to-port="1" /> <edge from-layer="1754" from-port="2" to-layer="1755" to-port="0" /> <edge from-layer="1755" from-port="3" to-layer="1757" to-port="0" /> <edge from-layer="1756" from-port="0" to-layer="1757" to-port="1" /> <edge from-layer="1757" from-port="2" to-layer="1759" to-port="0" /> <edge from-layer="1758" from-port="0" to-layer="1759" to-port="1" /> <edge from-layer="1759" from-port="2" to-layer="1770" to-port="0" /> <edge from-layer="1760" from-port="0" to-layer="1761" to-port="0" /> <edge from-layer="1761" from-port="1" to-layer="1764" to-port="0" /> <edge from-layer="1762" from-port="0" to-layer="1763" to-port="0" /> <edge from-layer="1763" from-port="1" to-layer="1764" to-port="1" /> <edge from-layer="1764" from-port="2" to-layer="1766" to-port="0" /> <edge from-layer="1765" from-port="0" to-layer="1766" to-port="1" /> <edge from-layer="1766" from-port="2" to-layer="1768" to-port="0" /> <edge from-layer="1767" from-port="0" to-layer="1768" to-port="1" /> <edge from-layer="1768" from-port="2" to-layer="1769" to-port="0" /> <edge from-layer="1769" from-port="1" to-layer="1770" to-port="1" /> <edge from-layer="1770" from-port="2" to-layer="1772" to-port="0" /> <edge from-layer="1771" from-port="0" to-layer="1772" to-port="1" /> <edge from-layer="1772" from-port="2" to-layer="1773" to-port="1" /> <edge from-layer="1773" from-port="2" to-layer="1807" to-port="0" /> <edge from-layer="1773" from-port="2" to-layer="1775" to-port="0" /> <edge from-layer="1774" from-port="0" to-layer="1775" to-port="1" /> <edge from-layer="1775" from-port="2" to-layer="1777" to-port="0" /> <edge from-layer="1776" from-port="0" to-layer="1777" to-port="1" /> <edge from-layer="1777" from-port="2" to-layer="1779" to-port="0" /> <edge from-layer="1778" from-port="0" to-layer="1779" to-port="1" /> <edge from-layer="1779" from-port="2" to-layer="1790" to-port="0" /> <edge from-layer="1780" from-port="0" to-layer="1781" to-port="0" /> <edge from-layer="1781" from-port="1" to-layer="1784" to-port="0" /> <edge from-layer="1782" from-port="0" to-layer="1783" to-port="0" /> <edge from-layer="1783" from-port="1" to-layer="1784" to-port="1" /> <edge from-layer="1784" from-port="2" to-layer="1786" to-port="0" /> <edge from-layer="1785" from-port="0" to-layer="1786" to-port="1" /> <edge from-layer="1786" from-port="2" to-layer="1788" to-port="0" /> <edge from-layer="1787" from-port="0" to-layer="1788" to-port="1" /> <edge from-layer="1788" from-port="2" to-layer="1789" to-port="0" /> <edge from-layer="1789" from-port="1" to-layer="1790" to-port="1" /> <edge from-layer="1790" from-port="2" to-layer="1792" to-port="0" /> <edge from-layer="1791" from-port="0" to-layer="1792" to-port="1" /> <edge from-layer="1792" from-port="2" to-layer="1793" to-port="0" /> <edge from-layer="1793" from-port="1" to-layer="1804" to-port="0" /> <edge from-layer="1794" from-port="0" to-layer="1795" to-port="0" /> <edge from-layer="1795" from-port="1" to-layer="1798" to-port="0" /> <edge from-layer="1796" from-port="0" to-layer="1797" to-port="0" /> <edge from-layer="1797" from-port="1" to-layer="1798" to-port="1" /> <edge from-layer="1798" from-port="2" to-layer="1800" to-port="0" /> <edge from-layer="1799" from-port="0" to-layer="1800" to-port="1" /> <edge from-layer="1800" from-port="2" to-layer="1802" to-port="0" /> <edge from-layer="1801" from-port="0" to-layer="1802" to-port="1" /> <edge from-layer="1802" from-port="2" to-layer="1803" to-port="0" /> <edge from-layer="1803" from-port="1" to-layer="1804" to-port="1" /> <edge from-layer="1804" from-port="2" to-layer="1806" to-port="0" /> <edge from-layer="1805" from-port="0" to-layer="1806" to-port="1" /> <edge from-layer="1806" from-port="2" to-layer="1807" to-port="1" /> <edge from-layer="1807" from-port="2" to-layer="1809" to-port="0" /> <edge from-layer="1807" from-port="2" to-layer="1901" to-port="0" /> <edge from-layer="1808" from-port="0" to-layer="1809" to-port="1" /> <edge from-layer="1809" from-port="2" to-layer="1811" to-port="0" /> <edge from-layer="1810" from-port="0" to-layer="1811" to-port="1" /> <edge from-layer="1811" from-port="2" to-layer="1813" to-port="0" /> <edge from-layer="1812" from-port="0" to-layer="1813" to-port="1" /> <edge from-layer="1813" from-port="2" to-layer="1875" to-port="0" /> <edge from-layer="1813" from-port="2" to-layer="1824" to-port="0" /> <edge from-layer="1813" from-port="2" to-layer="1850" to-port="0" /> <edge from-layer="1814" from-port="0" to-layer="1815" to-port="0" /> <edge from-layer="1815" from-port="1" to-layer="1818" to-port="0" /> <edge from-layer="1816" from-port="0" to-layer="1817" to-port="0" /> <edge from-layer="1817" from-port="1" to-layer="1818" to-port="1" /> <edge from-layer="1818" from-port="2" to-layer="1820" to-port="0" /> <edge from-layer="1819" from-port="0" to-layer="1820" to-port="1" /> <edge from-layer="1820" from-port="2" to-layer="1822" to-port="0" /> <edge from-layer="1821" from-port="0" to-layer="1822" to-port="1" /> <edge from-layer="1822" from-port="2" to-layer="1823" to-port="0" /> <edge from-layer="1823" from-port="1" to-layer="1824" to-port="1" /> <edge from-layer="1824" from-port="2" to-layer="1826" to-port="0" /> <edge from-layer="1825" from-port="0" to-layer="1826" to-port="1" /> <edge from-layer="1826" from-port="2" to-layer="1828" to-port="0" /> <edge from-layer="1827" from-port="0" to-layer="1828" to-port="1" /> <edge from-layer="1828" from-port="2" to-layer="1830" to-port="0" /> <edge from-layer="1829" from-port="0" to-layer="1830" to-port="1" /> <edge from-layer="1830" from-port="2" to-layer="1883" to-port="0" /> <edge from-layer="1831" from-port="0" to-layer="1836" to-port="0" /> <edge from-layer="1832" from-port="0" to-layer="1835" to-port="1" /> <edge from-layer="1833" from-port="0" to-layer="1835" to-port="2" /> <edge from-layer="1834" from-port="0" to-layer="1835" to-port="3" /> <edge from-layer="1835" from-port="4" to-layer="1836" to-port="1" /> <edge from-layer="1836" from-port="2" to-layer="1837" to-port="0" /> <edge from-layer="1837" from-port="1" to-layer="1839" to-port="0" /> <edge from-layer="1838" from-port="0" to-layer="1839" to-port="2" /> <edge from-layer="1839" from-port="3" to-layer="1855" to-port="0" /> <edge from-layer="1840" from-port="0" to-layer="1841" to-port="0" /> <edge from-layer="1841" from-port="1" to-layer="1844" to-port="0" /> <edge from-layer="1842" from-port="0" to-layer="1843" to-port="0" /> <edge from-layer="1843" from-port="1" to-layer="1844" to-port="1" /> <edge from-layer="1844" from-port="2" to-layer="1846" to-port="0" /> <edge from-layer="1845" from-port="0" to-layer="1846" to-port="1" /> <edge from-layer="1846" from-port="2" to-layer="1848" to-port="0" /> <edge from-layer="1847" from-port="0" to-layer="1848" to-port="1" /> <edge from-layer="1848" from-port="2" to-layer="1849" to-port="0" /> <edge from-layer="1849" from-port="1" to-layer="1850" to-port="1" /> <edge from-layer="1850" from-port="2" to-layer="1852" to-port="0" /> <edge from-layer="1851" from-port="0" to-layer="1852" to-port="1" /> <edge from-layer="1852" from-port="2" to-layer="1854" to-port="0" /> <edge from-layer="1853" from-port="0" to-layer="1854" to-port="1" /> <edge from-layer="1854" from-port="2" to-layer="1855" to-port="1" /> <edge from-layer="1855" from-port="2" to-layer="1883" to-port="1" /> <edge from-layer="1855" from-port="2" to-layer="2546" to-port="0" /> <edge from-layer="1856" from-port="0" to-layer="1861" to-port="0" /> <edge from-layer="1857" from-port="0" to-layer="1860" to-port="1" /> <edge from-layer="1858" from-port="0" to-layer="1860" to-port="2" /> <edge from-layer="1859" from-port="0" to-layer="1860" to-port="3" /> <edge from-layer="1860" from-port="4" to-layer="1861" to-port="1" /> <edge from-layer="1861" from-port="2" to-layer="1862" to-port="0" /> <edge from-layer="1862" from-port="1" to-layer="1864" to-port="0" /> <edge from-layer="1863" from-port="0" to-layer="1864" to-port="2" /> <edge from-layer="1864" from-port="3" to-layer="1882" to-port="0" /> <edge from-layer="1865" from-port="0" to-layer="1866" to-port="0" /> <edge from-layer="1866" from-port="1" to-layer="1869" to-port="0" /> <edge from-layer="1867" from-port="0" to-layer="1868" to-port="0" /> <edge from-layer="1868" from-port="1" to-layer="1869" to-port="1" /> <edge from-layer="1869" from-port="2" to-layer="1871" to-port="0" /> <edge from-layer="1870" from-port="0" to-layer="1871" to-port="1" /> <edge from-layer="1871" from-port="2" to-layer="1873" to-port="0" /> <edge from-layer="1872" from-port="0" to-layer="1873" to-port="1" /> <edge from-layer="1873" from-port="2" to-layer="1874" to-port="0" /> <edge from-layer="1874" from-port="1" to-layer="1875" to-port="1" /> <edge from-layer="1875" from-port="2" to-layer="1877" to-port="0" /> <edge from-layer="1876" from-port="0" to-layer="1877" to-port="1" /> <edge from-layer="1877" from-port="2" to-layer="1879" to-port="0" /> <edge from-layer="1878" from-port="0" to-layer="1879" to-port="1" /> <edge from-layer="1879" from-port="2" to-layer="1881" to-port="0" /> <edge from-layer="1880" from-port="0" to-layer="1881" to-port="1" /> <edge from-layer="1881" from-port="2" to-layer="1882" to-port="1" /> <edge from-layer="1882" from-port="2" to-layer="1883" to-port="2" /> <edge from-layer="1882" from-port="2" to-layer="2545" to-port="0" /> <edge from-layer="1883" from-port="4" to-layer="1885" to-port="0" /> <edge from-layer="1884" from-port="0" to-layer="1885" to-port="1" /> <edge from-layer="1885" from-port="2" to-layer="1887" to-port="0" /> <edge from-layer="1886" from-port="0" to-layer="1887" to-port="1" /> <edge from-layer="1887" from-port="2" to-layer="1898" to-port="0" /> <edge from-layer="1888" from-port="0" to-layer="1889" to-port="0" /> <edge from-layer="1889" from-port="1" to-layer="1892" to-port="0" /> <edge from-layer="1890" from-port="0" to-layer="1891" to-port="0" /> <edge from-layer="1891" from-port="1" to-layer="1892" to-port="1" /> <edge from-layer="1892" from-port="2" to-layer="1894" to-port="0" /> <edge from-layer="1893" from-port="0" to-layer="1894" to-port="1" /> <edge from-layer="1894" from-port="2" to-layer="1896" to-port="0" /> <edge from-layer="1895" from-port="0" to-layer="1896" to-port="1" /> <edge from-layer="1896" from-port="2" to-layer="1897" to-port="0" /> <edge from-layer="1897" from-port="1" to-layer="1898" to-port="1" /> <edge from-layer="1898" from-port="2" to-layer="1900" to-port="0" /> <edge from-layer="1899" from-port="0" to-layer="1900" to-port="1" /> <edge from-layer="1900" from-port="2" to-layer="1901" to-port="1" /> <edge from-layer="1901" from-port="2" to-layer="1903" to-port="0" /> <edge from-layer="1901" from-port="2" to-layer="1943" to-port="0" /> <edge from-layer="1902" from-port="0" to-layer="1903" to-port="1" /> <edge from-layer="1903" from-port="2" to-layer="1905" to-port="0" /> <edge from-layer="1904" from-port="0" to-layer="1905" to-port="1" /> <edge from-layer="1905" from-port="2" to-layer="1907" to-port="0" /> <edge from-layer="1906" from-port="0" to-layer="1907" to-port="1" /> <edge from-layer="1907" from-port="2" to-layer="1918" to-port="0" /> <edge from-layer="1908" from-port="0" to-layer="1909" to-port="0" /> <edge from-layer="1909" from-port="1" to-layer="1912" to-port="0" /> <edge from-layer="1910" from-port="0" to-layer="1911" to-port="0" /> <edge from-layer="1911" from-port="1" to-layer="1912" to-port="1" /> <edge from-layer="1912" from-port="2" to-layer="1914" to-port="0" /> <edge from-layer="1913" from-port="0" to-layer="1914" to-port="1" /> <edge from-layer="1914" from-port="2" to-layer="1916" to-port="0" /> <edge from-layer="1915" from-port="0" to-layer="1916" to-port="1" /> <edge from-layer="1916" from-port="2" to-layer="1917" to-port="0" /> <edge from-layer="1917" from-port="1" to-layer="1918" to-port="1" /> <edge from-layer="1918" from-port="2" to-layer="1920" to-port="0" /> <edge from-layer="1919" from-port="0" to-layer="1920" to-port="1" /> <edge from-layer="1920" from-port="2" to-layer="1922" to-port="0" /> <edge from-layer="1921" from-port="0" to-layer="1922" to-port="1" /> <edge from-layer="1922" from-port="2" to-layer="1924" to-port="0" /> <edge from-layer="1923" from-port="0" to-layer="1924" to-port="1" /> <edge from-layer="1924" from-port="2" to-layer="1925" to-port="0" /> <edge from-layer="1925" from-port="3" to-layer="1927" to-port="0" /> <edge from-layer="1926" from-port="0" to-layer="1927" to-port="1" /> <edge from-layer="1927" from-port="2" to-layer="1929" to-port="0" /> <edge from-layer="1928" from-port="0" to-layer="1929" to-port="1" /> <edge from-layer="1929" from-port="2" to-layer="1940" to-port="0" /> <edge from-layer="1930" from-port="0" to-layer="1931" to-port="0" /> <edge from-layer="1931" from-port="1" to-layer="1934" to-port="0" /> <edge from-layer="1932" from-port="0" to-layer="1933" to-port="0" /> <edge from-layer="1933" from-port="1" to-layer="1934" to-port="1" /> <edge from-layer="1934" from-port="2" to-layer="1936" to-port="0" /> <edge from-layer="1935" from-port="0" to-layer="1936" to-port="1" /> <edge from-layer="1936" from-port="2" to-layer="1938" to-port="0" /> <edge from-layer="1937" from-port="0" to-layer="1938" to-port="1" /> <edge from-layer="1938" from-port="2" to-layer="1939" to-port="0" /> <edge from-layer="1939" from-port="1" to-layer="1940" to-port="1" /> <edge from-layer="1940" from-port="2" to-layer="1942" to-port="0" /> <edge from-layer="1941" from-port="0" to-layer="1942" to-port="1" /> <edge from-layer="1942" from-port="2" to-layer="1943" to-port="1" /> <edge from-layer="1943" from-port="2" to-layer="1945" to-port="0" /> <edge from-layer="1943" from-port="2" to-layer="1977" to-port="0" /> <edge from-layer="1944" from-port="0" to-layer="1945" to-port="1" /> <edge from-layer="1945" from-port="2" to-layer="1947" to-port="0" /> <edge from-layer="1946" from-port="0" to-layer="1947" to-port="1" /> <edge from-layer="1947" from-port="2" to-layer="1949" to-port="0" /> <edge from-layer="1948" from-port="0" to-layer="1949" to-port="1" /> <edge from-layer="1949" from-port="2" to-layer="1960" to-port="0" /> <edge from-layer="1950" from-port="0" to-layer="1951" to-port="0" /> <edge from-layer="1951" from-port="1" to-layer="1954" to-port="0" /> <edge from-layer="1952" from-port="0" to-layer="1953" to-port="0" /> <edge from-layer="1953" from-port="1" to-layer="1954" to-port="1" /> <edge from-layer="1954" from-port="2" to-layer="1956" to-port="0" /> <edge from-layer="1955" from-port="0" to-layer="1956" to-port="1" /> <edge from-layer="1956" from-port="2" to-layer="1958" to-port="0" /> <edge from-layer="1957" from-port="0" to-layer="1958" to-port="1" /> <edge from-layer="1958" from-port="2" to-layer="1959" to-port="0" /> <edge from-layer="1959" from-port="1" to-layer="1960" to-port="1" /> <edge from-layer="1960" from-port="2" to-layer="1962" to-port="0" /> <edge from-layer="1961" from-port="0" to-layer="1962" to-port="1" /> <edge from-layer="1962" from-port="2" to-layer="1963" to-port="0" /> <edge from-layer="1963" from-port="1" to-layer="1974" to-port="0" /> <edge from-layer="1964" from-port="0" to-layer="1965" to-port="0" /> <edge from-layer="1965" from-port="1" to-layer="1968" to-port="0" /> <edge from-layer="1966" from-port="0" to-layer="1967" to-port="0" /> <edge from-layer="1967" from-port="1" to-layer="1968" to-port="1" /> <edge from-layer="1968" from-port="2" to-layer="1970" to-port="0" /> <edge from-layer="1969" from-port="0" to-layer="1970" to-port="1" /> <edge from-layer="1970" from-port="2" to-layer="1972" to-port="0" /> <edge from-layer="1971" from-port="0" to-layer="1972" to-port="1" /> <edge from-layer="1972" from-port="2" to-layer="1973" to-port="0" /> <edge from-layer="1973" from-port="1" to-layer="1974" to-port="1" /> <edge from-layer="1974" from-port="2" to-layer="1976" to-port="0" /> <edge from-layer="1975" from-port="0" to-layer="1976" to-port="1" /> <edge from-layer="1976" from-port="2" to-layer="1977" to-port="1" /> <edge from-layer="1977" from-port="2" to-layer="1979" to-port="0" /> <edge from-layer="1977" from-port="2" to-layer="2071" to-port="0" /> <edge from-layer="1978" from-port="0" to-layer="1979" to-port="1" /> <edge from-layer="1979" from-port="2" to-layer="1981" to-port="0" /> <edge from-layer="1980" from-port="0" to-layer="1981" to-port="1" /> <edge from-layer="1981" from-port="2" to-layer="1983" to-port="0" /> <edge from-layer="1982" from-port="0" to-layer="1983" to-port="1" /> <edge from-layer="1983" from-port="2" to-layer="2020" to-port="0" /> <edge from-layer="1983" from-port="2" to-layer="2045" to-port="0" /> <edge from-layer="1983" from-port="2" to-layer="1994" to-port="0" /> <edge from-layer="1984" from-port="0" to-layer="1985" to-port="0" /> <edge from-layer="1985" from-port="1" to-layer="1988" to-port="0" /> <edge from-layer="1986" from-port="0" to-layer="1987" to-port="0" /> <edge from-layer="1987" from-port="1" to-layer="1988" to-port="1" /> <edge from-layer="1988" from-port="2" to-layer="1990" to-port="0" /> <edge from-layer="1989" from-port="0" to-layer="1990" to-port="1" /> <edge from-layer="1990" from-port="2" to-layer="1992" to-port="0" /> <edge from-layer="1991" from-port="0" to-layer="1992" to-port="1" /> <edge from-layer="1992" from-port="2" to-layer="1993" to-port="0" /> <edge from-layer="1993" from-port="1" to-layer="1994" to-port="1" /> <edge from-layer="1994" from-port="2" to-layer="1996" to-port="0" /> <edge from-layer="1995" from-port="0" to-layer="1996" to-port="1" /> <edge from-layer="1996" from-port="2" to-layer="1998" to-port="0" /> <edge from-layer="1997" from-port="0" to-layer="1998" to-port="1" /> <edge from-layer="1998" from-port="2" to-layer="2000" to-port="0" /> <edge from-layer="1999" from-port="0" to-layer="2000" to-port="1" /> <edge from-layer="2000" from-port="2" to-layer="2053" to-port="0" /> <edge from-layer="2001" from-port="0" to-layer="2006" to-port="0" /> <edge from-layer="2002" from-port="0" to-layer="2005" to-port="1" /> <edge from-layer="2003" from-port="0" to-layer="2005" to-port="2" /> <edge from-layer="2004" from-port="0" to-layer="2005" to-port="3" /> <edge from-layer="2005" from-port="4" to-layer="2006" to-port="1" /> <edge from-layer="2006" from-port="2" to-layer="2007" to-port="0" /> <edge from-layer="2007" from-port="1" to-layer="2009" to-port="0" /> <edge from-layer="2008" from-port="0" to-layer="2009" to-port="2" /> <edge from-layer="2009" from-port="3" to-layer="2025" to-port="0" /> <edge from-layer="2010" from-port="0" to-layer="2011" to-port="0" /> <edge from-layer="2011" from-port="1" to-layer="2014" to-port="0" /> <edge from-layer="2012" from-port="0" to-layer="2013" to-port="0" /> <edge from-layer="2013" from-port="1" to-layer="2014" to-port="1" /> <edge from-layer="2014" from-port="2" to-layer="2016" to-port="0" /> <edge from-layer="2015" from-port="0" to-layer="2016" to-port="1" /> <edge from-layer="2016" from-port="2" to-layer="2018" to-port="0" /> <edge from-layer="2017" from-port="0" to-layer="2018" to-port="1" /> <edge from-layer="2018" from-port="2" to-layer="2019" to-port="0" /> <edge from-layer="2019" from-port="1" to-layer="2020" to-port="1" /> <edge from-layer="2020" from-port="2" to-layer="2022" to-port="0" /> <edge from-layer="2021" from-port="0" to-layer="2022" to-port="1" /> <edge from-layer="2022" from-port="2" to-layer="2024" to-port="0" /> <edge from-layer="2023" from-port="0" to-layer="2024" to-port="1" /> <edge from-layer="2024" from-port="2" to-layer="2025" to-port="1" /> <edge from-layer="2025" from-port="2" to-layer="2544" to-port="0" /> <edge from-layer="2025" from-port="2" to-layer="2053" to-port="1" /> <edge from-layer="2026" from-port="0" to-layer="2031" to-port="0" /> <edge from-layer="2027" from-port="0" to-layer="2030" to-port="1" /> <edge from-layer="2028" from-port="0" to-layer="2030" to-port="2" /> <edge from-layer="2029" from-port="0" to-layer="2030" to-port="3" /> <edge from-layer="2030" from-port="4" to-layer="2031" to-port="1" /> <edge from-layer="2031" from-port="2" to-layer="2032" to-port="0" /> <edge from-layer="2032" from-port="1" to-layer="2034" to-port="0" /> <edge from-layer="2033" from-port="0" to-layer="2034" to-port="2" /> <edge from-layer="2034" from-port="3" to-layer="2052" to-port="0" /> <edge from-layer="2035" from-port="0" to-layer="2036" to-port="0" /> <edge from-layer="2036" from-port="1" to-layer="2039" to-port="0" /> <edge from-layer="2037" from-port="0" to-layer="2038" to-port="0" /> <edge from-layer="2038" from-port="1" to-layer="2039" to-port="1" /> <edge from-layer="2039" from-port="2" to-layer="2041" to-port="0" /> <edge from-layer="2040" from-port="0" to-layer="2041" to-port="1" /> <edge from-layer="2041" from-port="2" to-layer="2043" to-port="0" /> <edge from-layer="2042" from-port="0" to-layer="2043" to-port="1" /> <edge from-layer="2043" from-port="2" to-layer="2044" to-port="0" /> <edge from-layer="2044" from-port="1" to-layer="2045" to-port="1" /> <edge from-layer="2045" from-port="2" to-layer="2047" to-port="0" /> <edge from-layer="2046" from-port="0" to-layer="2047" to-port="1" /> <edge from-layer="2047" from-port="2" to-layer="2049" to-port="0" /> <edge from-layer="2048" from-port="0" to-layer="2049" to-port="1" /> <edge from-layer="2049" from-port="2" to-layer="2051" to-port="0" /> <edge from-layer="2050" from-port="0" to-layer="2051" to-port="1" /> <edge from-layer="2051" from-port="2" to-layer="2052" to-port="1" /> <edge from-layer="2052" from-port="2" to-layer="2543" to-port="0" /> <edge from-layer="2052" from-port="2" to-layer="2053" to-port="2" /> <edge from-layer="2053" from-port="4" to-layer="2055" to-port="0" /> <edge from-layer="2054" from-port="0" to-layer="2055" to-port="1" /> <edge from-layer="2055" from-port="2" to-layer="2057" to-port="0" /> <edge from-layer="2056" from-port="0" to-layer="2057" to-port="1" /> <edge from-layer="2057" from-port="2" to-layer="2068" to-port="0" /> <edge from-layer="2058" from-port="0" to-layer="2059" to-port="0" /> <edge from-layer="2059" from-port="1" to-layer="2062" to-port="0" /> <edge from-layer="2060" from-port="0" to-layer="2061" to-port="0" /> <edge from-layer="2061" from-port="1" to-layer="2062" to-port="1" /> <edge from-layer="2062" from-port="2" to-layer="2064" to-port="0" /> <edge from-layer="2063" from-port="0" to-layer="2064" to-port="1" /> <edge from-layer="2064" from-port="2" to-layer="2066" to-port="0" /> <edge from-layer="2065" from-port="0" to-layer="2066" to-port="1" /> <edge from-layer="2066" from-port="2" to-layer="2067" to-port="0" /> <edge from-layer="2067" from-port="1" to-layer="2068" to-port="1" /> <edge from-layer="2068" from-port="2" to-layer="2070" to-port="0" /> <edge from-layer="2069" from-port="0" to-layer="2070" to-port="1" /> <edge from-layer="2070" from-port="2" to-layer="2071" to-port="1" /> <edge from-layer="2071" from-port="2" to-layer="2073" to-port="0" /> <edge from-layer="2071" from-port="2" to-layer="2113" to-port="0" /> <edge from-layer="2072" from-port="0" to-layer="2073" to-port="1" /> <edge from-layer="2073" from-port="2" to-layer="2075" to-port="0" /> <edge from-layer="2074" from-port="0" to-layer="2075" to-port="1" /> <edge from-layer="2075" from-port="2" to-layer="2077" to-port="0" /> <edge from-layer="2076" from-port="0" to-layer="2077" to-port="1" /> <edge from-layer="2077" from-port="2" to-layer="2088" to-port="0" /> <edge from-layer="2078" from-port="0" to-layer="2079" to-port="0" /> <edge from-layer="2079" from-port="1" to-layer="2082" to-port="0" /> <edge from-layer="2080" from-port="0" to-layer="2081" to-port="0" /> <edge from-layer="2081" from-port="1" to-layer="2082" to-port="1" /> <edge from-layer="2082" from-port="2" to-layer="2084" to-port="0" /> <edge from-layer="2083" from-port="0" to-layer="2084" to-port="1" /> <edge from-layer="2084" from-port="2" to-layer="2086" to-port="0" /> <edge from-layer="2085" from-port="0" to-layer="2086" to-port="1" /> <edge from-layer="2086" from-port="2" to-layer="2087" to-port="0" /> <edge from-layer="2087" from-port="1" to-layer="2088" to-port="1" /> <edge from-layer="2088" from-port="2" to-layer="2090" to-port="0" /> <edge from-layer="2089" from-port="0" to-layer="2090" to-port="1" /> <edge from-layer="2090" from-port="2" to-layer="2092" to-port="0" /> <edge from-layer="2091" from-port="0" to-layer="2092" to-port="1" /> <edge from-layer="2092" from-port="2" to-layer="2094" to-port="0" /> <edge from-layer="2093" from-port="0" to-layer="2094" to-port="1" /> <edge from-layer="2094" from-port="2" to-layer="2095" to-port="0" /> <edge from-layer="2095" from-port="3" to-layer="2097" to-port="0" /> <edge from-layer="2096" from-port="0" to-layer="2097" to-port="1" /> <edge from-layer="2097" from-port="2" to-layer="2099" to-port="0" /> <edge from-layer="2098" from-port="0" to-layer="2099" to-port="1" /> <edge from-layer="2099" from-port="2" to-layer="2110" to-port="0" /> <edge from-layer="2100" from-port="0" to-layer="2101" to-port="0" /> <edge from-layer="2101" from-port="1" to-layer="2104" to-port="0" /> <edge from-layer="2102" from-port="0" to-layer="2103" to-port="0" /> <edge from-layer="2103" from-port="1" to-layer="2104" to-port="1" /> <edge from-layer="2104" from-port="2" to-layer="2106" to-port="0" /> <edge from-layer="2105" from-port="0" to-layer="2106" to-port="1" /> <edge from-layer="2106" from-port="2" to-layer="2108" to-port="0" /> <edge from-layer="2107" from-port="0" to-layer="2108" to-port="1" /> <edge from-layer="2108" from-port="2" to-layer="2109" to-port="0" /> <edge from-layer="2109" from-port="1" to-layer="2110" to-port="1" /> <edge from-layer="2110" from-port="2" to-layer="2112" to-port="0" /> <edge from-layer="2111" from-port="0" to-layer="2112" to-port="1" /> <edge from-layer="2112" from-port="2" to-layer="2113" to-port="1" /> <edge from-layer="2113" from-port="2" to-layer="2115" to-port="0" /> <edge from-layer="2113" from-port="2" to-layer="2147" to-port="0" /> <edge from-layer="2114" from-port="0" to-layer="2115" to-port="1" /> <edge from-layer="2115" from-port="2" to-layer="2117" to-port="0" /> <edge from-layer="2116" from-port="0" to-layer="2117" to-port="1" /> <edge from-layer="2117" from-port="2" to-layer="2119" to-port="0" /> <edge from-layer="2118" from-port="0" to-layer="2119" to-port="1" /> <edge from-layer="2119" from-port="2" to-layer="2130" to-port="0" /> <edge from-layer="2120" from-port="0" to-layer="2121" to-port="0" /> <edge from-layer="2121" from-port="1" to-layer="2124" to-port="0" /> <edge from-layer="2122" from-port="0" to-layer="2123" to-port="0" /> <edge from-layer="2123" from-port="1" to-layer="2124" to-port="1" /> <edge from-layer="2124" from-port="2" to-layer="2126" to-port="0" /> <edge from-layer="2125" from-port="0" to-layer="2126" to-port="1" /> <edge from-layer="2126" from-port="2" to-layer="2128" to-port="0" /> <edge from-layer="2127" from-port="0" to-layer="2128" to-port="1" /> <edge from-layer="2128" from-port="2" to-layer="2129" to-port="0" /> <edge from-layer="2129" from-port="1" to-layer="2130" to-port="1" /> <edge from-layer="2130" from-port="2" to-layer="2132" to-port="0" /> <edge from-layer="2131" from-port="0" to-layer="2132" to-port="1" /> <edge from-layer="2132" from-port="2" to-layer="2133" to-port="0" /> <edge from-layer="2133" from-port="1" to-layer="2144" to-port="0" /> <edge from-layer="2134" from-port="0" to-layer="2135" to-port="0" /> <edge from-layer="2135" from-port="1" to-layer="2138" to-port="0" /> <edge from-layer="2136" from-port="0" to-layer="2137" to-port="0" /> <edge from-layer="2137" from-port="1" to-layer="2138" to-port="1" /> <edge from-layer="2138" from-port="2" to-layer="2140" to-port="0" /> <edge from-layer="2139" from-port="0" to-layer="2140" to-port="1" /> <edge from-layer="2140" from-port="2" to-layer="2142" to-port="0" /> <edge from-layer="2141" from-port="0" to-layer="2142" to-port="1" /> <edge from-layer="2142" from-port="2" to-layer="2143" to-port="0" /> <edge from-layer="2143" from-port="1" to-layer="2144" to-port="1" /> <edge from-layer="2144" from-port="2" to-layer="2146" to-port="0" /> <edge from-layer="2145" from-port="0" to-layer="2146" to-port="1" /> <edge from-layer="2146" from-port="2" to-layer="2147" to-port="1" /> <edge from-layer="2147" from-port="2" to-layer="2149" to-port="0" /> <edge from-layer="2147" from-port="2" to-layer="2241" to-port="0" /> <edge from-layer="2148" from-port="0" to-layer="2149" to-port="1" /> <edge from-layer="2149" from-port="2" to-layer="2151" to-port="0" /> <edge from-layer="2150" from-port="0" to-layer="2151" to-port="1" /> <edge from-layer="2151" from-port="2" to-layer="2153" to-port="0" /> <edge from-layer="2152" from-port="0" to-layer="2153" to-port="1" /> <edge from-layer="2153" from-port="2" to-layer="2164" to-port="0" /> <edge from-layer="2153" from-port="2" to-layer="2190" to-port="0" /> <edge from-layer="2153" from-port="2" to-layer="2215" to-port="0" /> <edge from-layer="2154" from-port="0" to-layer="2155" to-port="0" /> <edge from-layer="2155" from-port="1" to-layer="2158" to-port="0" /> <edge from-layer="2156" from-port="0" to-layer="2157" to-port="0" /> <edge from-layer="2157" from-port="1" to-layer="2158" to-port="1" /> <edge from-layer="2158" from-port="2" to-layer="2160" to-port="0" /> <edge from-layer="2159" from-port="0" to-layer="2160" to-port="1" /> <edge from-layer="2160" from-port="2" to-layer="2162" to-port="0" /> <edge from-layer="2161" from-port="0" to-layer="2162" to-port="1" /> <edge from-layer="2162" from-port="2" to-layer="2163" to-port="0" /> <edge from-layer="2163" from-port="1" to-layer="2164" to-port="1" /> <edge from-layer="2164" from-port="2" to-layer="2166" to-port="0" /> <edge from-layer="2165" from-port="0" to-layer="2166" to-port="1" /> <edge from-layer="2166" from-port="2" to-layer="2168" to-port="0" /> <edge from-layer="2167" from-port="0" to-layer="2168" to-port="1" /> <edge from-layer="2168" from-port="2" to-layer="2170" to-port="0" /> <edge from-layer="2169" from-port="0" to-layer="2170" to-port="1" /> <edge from-layer="2170" from-port="2" to-layer="2223" to-port="0" /> <edge from-layer="2171" from-port="0" to-layer="2176" to-port="0" /> <edge from-layer="2172" from-port="0" to-layer="2175" to-port="1" /> <edge from-layer="2173" from-port="0" to-layer="2175" to-port="2" /> <edge from-layer="2174" from-port="0" to-layer="2175" to-port="3" /> <edge from-layer="2175" from-port="4" to-layer="2176" to-port="1" /> <edge from-layer="2176" from-port="2" to-layer="2177" to-port="0" /> <edge from-layer="2177" from-port="1" to-layer="2179" to-port="0" /> <edge from-layer="2178" from-port="0" to-layer="2179" to-port="2" /> <edge from-layer="2179" from-port="3" to-layer="2195" to-port="0" /> <edge from-layer="2180" from-port="0" to-layer="2181" to-port="0" /> <edge from-layer="2181" from-port="1" to-layer="2184" to-port="0" /> <edge from-layer="2182" from-port="0" to-layer="2183" to-port="0" /> <edge from-layer="2183" from-port="1" to-layer="2184" to-port="1" /> <edge from-layer="2184" from-port="2" to-layer="2186" to-port="0" /> <edge from-layer="2185" from-port="0" to-layer="2186" to-port="1" /> <edge from-layer="2186" from-port="2" to-layer="2188" to-port="0" /> <edge from-layer="2187" from-port="0" to-layer="2188" to-port="1" /> <edge from-layer="2188" from-port="2" to-layer="2189" to-port="0" /> <edge from-layer="2189" from-port="1" to-layer="2190" to-port="1" /> <edge from-layer="2190" from-port="2" to-layer="2192" to-port="0" /> <edge from-layer="2191" from-port="0" to-layer="2192" to-port="1" /> <edge from-layer="2192" from-port="2" to-layer="2194" to-port="0" /> <edge from-layer="2193" from-port="0" to-layer="2194" to-port="1" /> <edge from-layer="2194" from-port="2" to-layer="2195" to-port="1" /> <edge from-layer="2195" from-port="2" to-layer="2542" to-port="0" /> <edge from-layer="2195" from-port="2" to-layer="2223" to-port="1" /> <edge from-layer="2196" from-port="0" to-layer="2201" to-port="0" /> <edge from-layer="2197" from-port="0" to-layer="2200" to-port="1" /> <edge from-layer="2198" from-port="0" to-layer="2200" to-port="2" /> <edge from-layer="2199" from-port="0" to-layer="2200" to-port="3" /> <edge from-layer="2200" from-port="4" to-layer="2201" to-port="1" /> <edge from-layer="2201" from-port="2" to-layer="2202" to-port="0" /> <edge from-layer="2202" from-port="1" to-layer="2204" to-port="0" /> <edge from-layer="2203" from-port="0" to-layer="2204" to-port="2" /> <edge from-layer="2204" from-port="3" to-layer="2222" to-port="0" /> <edge from-layer="2205" from-port="0" to-layer="2206" to-port="0" /> <edge from-layer="2206" from-port="1" to-layer="2209" to-port="0" /> <edge from-layer="2207" from-port="0" to-layer="2208" to-port="0" /> <edge from-layer="2208" from-port="1" to-layer="2209" to-port="1" /> <edge from-layer="2209" from-port="2" to-layer="2211" to-port="0" /> <edge from-layer="2210" from-port="0" to-layer="2211" to-port="1" /> <edge from-layer="2211" from-port="2" to-layer="2213" to-port="0" /> <edge from-layer="2212" from-port="0" to-layer="2213" to-port="1" /> <edge from-layer="2213" from-port="2" to-layer="2214" to-port="0" /> <edge from-layer="2214" from-port="1" to-layer="2215" to-port="1" /> <edge from-layer="2215" from-port="2" to-layer="2217" to-port="0" /> <edge from-layer="2216" from-port="0" to-layer="2217" to-port="1" /> <edge from-layer="2217" from-port="2" to-layer="2219" to-port="0" /> <edge from-layer="2218" from-port="0" to-layer="2219" to-port="1" /> <edge from-layer="2219" from-port="2" to-layer="2221" to-port="0" /> <edge from-layer="2220" from-port="0" to-layer="2221" to-port="1" /> <edge from-layer="2221" from-port="2" to-layer="2222" to-port="1" /> <edge from-layer="2222" from-port="2" to-layer="2541" to-port="0" /> <edge from-layer="2222" from-port="2" to-layer="2223" to-port="2" /> <edge from-layer="2223" from-port="4" to-layer="2225" to-port="0" /> <edge from-layer="2224" from-port="0" to-layer="2225" to-port="1" /> <edge from-layer="2225" from-port="2" to-layer="2227" to-port="0" /> <edge from-layer="2226" from-port="0" to-layer="2227" to-port="1" /> <edge from-layer="2227" from-port="2" to-layer="2238" to-port="0" /> <edge from-layer="2228" from-port="0" to-layer="2229" to-port="0" /> <edge from-layer="2229" from-port="1" to-layer="2232" to-port="0" /> <edge from-layer="2230" from-port="0" to-layer="2231" to-port="0" /> <edge from-layer="2231" from-port="1" to-layer="2232" to-port="1" /> <edge from-layer="2232" from-port="2" to-layer="2234" to-port="0" /> <edge from-layer="2233" from-port="0" to-layer="2234" to-port="1" /> <edge from-layer="2234" from-port="2" to-layer="2236" to-port="0" /> <edge from-layer="2235" from-port="0" to-layer="2236" to-port="1" /> <edge from-layer="2236" from-port="2" to-layer="2237" to-port="0" /> <edge from-layer="2237" from-port="1" to-layer="2238" to-port="1" /> <edge from-layer="2238" from-port="2" to-layer="2240" to-port="0" /> <edge from-layer="2239" from-port="0" to-layer="2240" to-port="1" /> <edge from-layer="2240" from-port="2" to-layer="2241" to-port="1" /> <edge from-layer="2241" from-port="2" to-layer="2283" to-port="0" /> <edge from-layer="2241" from-port="2" to-layer="2243" to-port="0" /> <edge from-layer="2242" from-port="0" to-layer="2243" to-port="1" /> <edge from-layer="2243" from-port="2" to-layer="2245" to-port="0" /> <edge from-layer="2244" from-port="0" to-layer="2245" to-port="1" /> <edge from-layer="2245" from-port="2" to-layer="2247" to-port="0" /> <edge from-layer="2246" from-port="0" to-layer="2247" to-port="1" /> <edge from-layer="2247" from-port="2" to-layer="2258" to-port="0" /> <edge from-layer="2248" from-port="0" to-layer="2249" to-port="0" /> <edge from-layer="2249" from-port="1" to-layer="2252" to-port="0" /> <edge from-layer="2250" from-port="0" to-layer="2251" to-port="0" /> <edge from-layer="2251" from-port="1" to-layer="2252" to-port="1" /> <edge from-layer="2252" from-port="2" to-layer="2254" to-port="0" /> <edge from-layer="2253" from-port="0" to-layer="2254" to-port="1" /> <edge from-layer="2254" from-port="2" to-layer="2256" to-port="0" /> <edge from-layer="2255" from-port="0" to-layer="2256" to-port="1" /> <edge from-layer="2256" from-port="2" to-layer="2257" to-port="0" /> <edge from-layer="2257" from-port="1" to-layer="2258" to-port="1" /> <edge from-layer="2258" from-port="2" to-layer="2260" to-port="0" /> <edge from-layer="2259" from-port="0" to-layer="2260" to-port="1" /> <edge from-layer="2260" from-port="2" to-layer="2262" to-port="0" /> <edge from-layer="2261" from-port="0" to-layer="2262" to-port="1" /> <edge from-layer="2262" from-port="2" to-layer="2264" to-port="0" /> <edge from-layer="2263" from-port="0" to-layer="2264" to-port="1" /> <edge from-layer="2264" from-port="2" to-layer="2265" to-port="0" /> <edge from-layer="2265" from-port="3" to-layer="2267" to-port="0" /> <edge from-layer="2266" from-port="0" to-layer="2267" to-port="1" /> <edge from-layer="2267" from-port="2" to-layer="2269" to-port="0" /> <edge from-layer="2268" from-port="0" to-layer="2269" to-port="1" /> <edge from-layer="2269" from-port="2" to-layer="2280" to-port="0" /> <edge from-layer="2270" from-port="0" to-layer="2271" to-port="0" /> <edge from-layer="2271" from-port="1" to-layer="2274" to-port="0" /> <edge from-layer="2272" from-port="0" to-layer="2273" to-port="0" /> <edge from-layer="2273" from-port="1" to-layer="2274" to-port="1" /> <edge from-layer="2274" from-port="2" to-layer="2276" to-port="0" /> <edge from-layer="2275" from-port="0" to-layer="2276" to-port="1" /> <edge from-layer="2276" from-port="2" to-layer="2278" to-port="0" /> <edge from-layer="2277" from-port="0" to-layer="2278" to-port="1" /> <edge from-layer="2278" from-port="2" to-layer="2279" to-port="0" /> <edge from-layer="2279" from-port="1" to-layer="2280" to-port="1" /> <edge from-layer="2280" from-port="2" to-layer="2282" to-port="0" /> <edge from-layer="2281" from-port="0" to-layer="2282" to-port="1" /> <edge from-layer="2282" from-port="2" to-layer="2283" to-port="1" /> <edge from-layer="2283" from-port="2" to-layer="2285" to-port="0" /> <edge from-layer="2283" from-port="2" to-layer="2317" to-port="0" /> <edge from-layer="2284" from-port="0" to-layer="2285" to-port="1" /> <edge from-layer="2285" from-port="2" to-layer="2287" to-port="0" /> <edge from-layer="2286" from-port="0" to-layer="2287" to-port="1" /> <edge from-layer="2287" from-port="2" to-layer="2289" to-port="0" /> <edge from-layer="2288" from-port="0" to-layer="2289" to-port="1" /> <edge from-layer="2289" from-port="2" to-layer="2300" to-port="0" /> <edge from-layer="2290" from-port="0" to-layer="2291" to-port="0" /> <edge from-layer="2291" from-port="1" to-layer="2294" to-port="0" /> <edge from-layer="2292" from-port="0" to-layer="2293" to-port="0" /> <edge from-layer="2293" from-port="1" to-layer="2294" to-port="1" /> <edge from-layer="2294" from-port="2" to-layer="2296" to-port="0" /> <edge from-layer="2295" from-port="0" to-layer="2296" to-port="1" /> <edge from-layer="2296" from-port="2" to-layer="2298" to-port="0" /> <edge from-layer="2297" from-port="0" to-layer="2298" to-port="1" /> <edge from-layer="2298" from-port="2" to-layer="2299" to-port="0" /> <edge from-layer="2299" from-port="1" to-layer="2300" to-port="1" /> <edge from-layer="2300" from-port="2" to-layer="2302" to-port="0" /> <edge from-layer="2301" from-port="0" to-layer="2302" to-port="1" /> <edge from-layer="2302" from-port="2" to-layer="2303" to-port="0" /> <edge from-layer="2303" from-port="1" to-layer="2314" to-port="0" /> <edge from-layer="2304" from-port="0" to-layer="2305" to-port="0" /> <edge from-layer="2305" from-port="1" to-layer="2308" to-port="0" /> <edge from-layer="2306" from-port="0" to-layer="2307" to-port="0" /> <edge from-layer="2307" from-port="1" to-layer="2308" to-port="1" /> <edge from-layer="2308" from-port="2" to-layer="2310" to-port="0" /> <edge from-layer="2309" from-port="0" to-layer="2310" to-port="1" /> <edge from-layer="2310" from-port="2" to-layer="2312" to-port="0" /> <edge from-layer="2311" from-port="0" to-layer="2312" to-port="1" /> <edge from-layer="2312" from-port="2" to-layer="2313" to-port="0" /> <edge from-layer="2313" from-port="1" to-layer="2314" to-port="1" /> <edge from-layer="2314" from-port="2" to-layer="2316" to-port="0" /> <edge from-layer="2315" from-port="0" to-layer="2316" to-port="1" /> <edge from-layer="2316" from-port="2" to-layer="2317" to-port="1" /> <edge from-layer="2317" from-port="2" to-layer="2411" to-port="0" /> <edge from-layer="2317" from-port="2" to-layer="2319" to-port="0" /> <edge from-layer="2318" from-port="0" to-layer="2319" to-port="1" /> <edge from-layer="2319" from-port="2" to-layer="2321" to-port="0" /> <edge from-layer="2320" from-port="0" to-layer="2321" to-port="1" /> <edge from-layer="2321" from-port="2" to-layer="2323" to-port="0" /> <edge from-layer="2322" from-port="0" to-layer="2323" to-port="1" /> <edge from-layer="2323" from-port="2" to-layer="2360" to-port="0" /> <edge from-layer="2323" from-port="2" to-layer="2334" to-port="0" /> <edge from-layer="2323" from-port="2" to-layer="2385" to-port="0" /> <edge from-layer="2324" from-port="0" to-layer="2325" to-port="0" /> <edge from-layer="2325" from-port="1" to-layer="2328" to-port="0" /> <edge from-layer="2326" from-port="0" to-layer="2327" to-port="0" /> <edge from-layer="2327" from-port="1" to-layer="2328" to-port="1" /> <edge from-layer="2328" from-port="2" to-layer="2330" to-port="0" /> <edge from-layer="2329" from-port="0" to-layer="2330" to-port="1" /> <edge from-layer="2330" from-port="2" to-layer="2332" to-port="0" /> <edge from-layer="2331" from-port="0" to-layer="2332" to-port="1" /> <edge from-layer="2332" from-port="2" to-layer="2333" to-port="0" /> <edge from-layer="2333" from-port="1" to-layer="2334" to-port="1" /> <edge from-layer="2334" from-port="2" to-layer="2336" to-port="0" /> <edge from-layer="2335" from-port="0" to-layer="2336" to-port="1" /> <edge from-layer="2336" from-port="2" to-layer="2338" to-port="0" /> <edge from-layer="2337" from-port="0" to-layer="2338" to-port="1" /> <edge from-layer="2338" from-port="2" to-layer="2340" to-port="0" /> <edge from-layer="2339" from-port="0" to-layer="2340" to-port="1" /> <edge from-layer="2340" from-port="2" to-layer="2393" to-port="0" /> <edge from-layer="2341" from-port="0" to-layer="2346" to-port="0" /> <edge from-layer="2342" from-port="0" to-layer="2345" to-port="1" /> <edge from-layer="2343" from-port="0" to-layer="2345" to-port="2" /> <edge from-layer="2344" from-port="0" to-layer="2345" to-port="3" /> <edge from-layer="2345" from-port="4" to-layer="2346" to-port="1" /> <edge from-layer="2346" from-port="2" to-layer="2347" to-port="0" /> <edge from-layer="2347" from-port="1" to-layer="2349" to-port="0" /> <edge from-layer="2348" from-port="0" to-layer="2349" to-port="2" /> <edge from-layer="2349" from-port="3" to-layer="2365" to-port="0" /> <edge from-layer="2350" from-port="0" to-layer="2351" to-port="0" /> <edge from-layer="2351" from-port="1" to-layer="2354" to-port="0" /> <edge from-layer="2352" from-port="0" to-layer="2353" to-port="0" /> <edge from-layer="2353" from-port="1" to-layer="2354" to-port="1" /> <edge from-layer="2354" from-port="2" to-layer="2356" to-port="0" /> <edge from-layer="2355" from-port="0" to-layer="2356" to-port="1" /> <edge from-layer="2356" from-port="2" to-layer="2358" to-port="0" /> <edge from-layer="2357" from-port="0" to-layer="2358" to-port="1" /> <edge from-layer="2358" from-port="2" to-layer="2359" to-port="0" /> <edge from-layer="2359" from-port="1" to-layer="2360" to-port="1" /> <edge from-layer="2360" from-port="2" to-layer="2362" to-port="0" /> <edge from-layer="2361" from-port="0" to-layer="2362" to-port="1" /> <edge from-layer="2362" from-port="2" to-layer="2364" to-port="0" /> <edge from-layer="2363" from-port="0" to-layer="2364" to-port="1" /> <edge from-layer="2364" from-port="2" to-layer="2365" to-port="1" /> <edge from-layer="2365" from-port="2" to-layer="2393" to-port="1" /> <edge from-layer="2365" from-port="2" to-layer="2540" to-port="0" /> <edge from-layer="2366" from-port="0" to-layer="2371" to-port="0" /> <edge from-layer="2367" from-port="0" to-layer="2370" to-port="1" /> <edge from-layer="2368" from-port="0" to-layer="2370" to-port="2" /> <edge from-layer="2369" from-port="0" to-layer="2370" to-port="3" /> <edge from-layer="2370" from-port="4" to-layer="2371" to-port="1" /> <edge from-layer="2371" from-port="2" to-layer="2372" to-port="0" /> <edge from-layer="2372" from-port="1" to-layer="2374" to-port="0" /> <edge from-layer="2373" from-port="0" to-layer="2374" to-port="2" /> <edge from-layer="2374" from-port="3" to-layer="2392" to-port="0" /> <edge from-layer="2375" from-port="0" to-layer="2376" to-port="0" /> <edge from-layer="2376" from-port="1" to-layer="2379" to-port="0" /> <edge from-layer="2377" from-port="0" to-layer="2378" to-port="0" /> <edge from-layer="2378" from-port="1" to-layer="2379" to-port="1" /> <edge from-layer="2379" from-port="2" to-layer="2381" to-port="0" /> <edge from-layer="2380" from-port="0" to-layer="2381" to-port="1" /> <edge from-layer="2381" from-port="2" to-layer="2383" to-port="0" /> <edge from-layer="2382" from-port="0" to-layer="2383" to-port="1" /> <edge from-layer="2383" from-port="2" to-layer="2384" to-port="0" /> <edge from-layer="2384" from-port="1" to-layer="2385" to-port="1" /> <edge from-layer="2385" from-port="2" to-layer="2387" to-port="0" /> <edge from-layer="2386" from-port="0" to-layer="2387" to-port="1" /> <edge from-layer="2387" from-port="2" to-layer="2389" to-port="0" /> <edge from-layer="2388" from-port="0" to-layer="2389" to-port="1" /> <edge from-layer="2389" from-port="2" to-layer="2391" to-port="0" /> <edge from-layer="2390" from-port="0" to-layer="2391" to-port="1" /> <edge from-layer="2391" from-port="2" to-layer="2392" to-port="1" /> <edge from-layer="2392" from-port="2" to-layer="2393" to-port="2" /> <edge from-layer="2392" from-port="2" to-layer="2539" to-port="0" /> <edge from-layer="2393" from-port="4" to-layer="2395" to-port="0" /> <edge from-layer="2394" from-port="0" to-layer="2395" to-port="1" /> <edge from-layer="2395" from-port="2" to-layer="2397" to-port="0" /> <edge from-layer="2396" from-port="0" to-layer="2397" to-port="1" /> <edge from-layer="2397" from-port="2" to-layer="2408" to-port="0" /> <edge from-layer="2398" from-port="0" to-layer="2399" to-port="0" /> <edge from-layer="2399" from-port="1" to-layer="2402" to-port="0" /> <edge from-layer="2400" from-port="0" to-layer="2401" to-port="0" /> <edge from-layer="2401" from-port="1" to-layer="2402" to-port="1" /> <edge from-layer="2402" from-port="2" to-layer="2404" to-port="0" /> <edge from-layer="2403" from-port="0" to-layer="2404" to-port="1" /> <edge from-layer="2404" from-port="2" to-layer="2406" to-port="0" /> <edge from-layer="2405" from-port="0" to-layer="2406" to-port="1" /> <edge from-layer="2406" from-port="2" to-layer="2407" to-port="0" /> <edge from-layer="2407" from-port="1" to-layer="2408" to-port="1" /> <edge from-layer="2408" from-port="2" to-layer="2410" to-port="0" /> <edge from-layer="2409" from-port="0" to-layer="2410" to-port="1" /> <edge from-layer="2410" from-port="2" to-layer="2411" to-port="1" /> <edge from-layer="2411" from-port="2" to-layer="2453" to-port="0" /> <edge from-layer="2411" from-port="2" to-layer="2413" to-port="0" /> <edge from-layer="2412" from-port="0" to-layer="2413" to-port="1" /> <edge from-layer="2413" from-port="2" to-layer="2415" to-port="0" /> <edge from-layer="2414" from-port="0" to-layer="2415" to-port="1" /> <edge from-layer="2415" from-port="2" to-layer="2417" to-port="0" /> <edge from-layer="2416" from-port="0" to-layer="2417" to-port="1" /> <edge from-layer="2417" from-port="2" to-layer="2428" to-port="0" /> <edge from-layer="2418" from-port="0" to-layer="2419" to-port="0" /> <edge from-layer="2419" from-port="1" to-layer="2422" to-port="0" /> <edge from-layer="2420" from-port="0" to-layer="2421" to-port="0" /> <edge from-layer="2421" from-port="1" to-layer="2422" to-port="1" /> <edge from-layer="2422" from-port="2" to-layer="2424" to-port="0" /> <edge from-layer="2423" from-port="0" to-layer="2424" to-port="1" /> <edge from-layer="2424" from-port="2" to-layer="2426" to-port="0" /> <edge from-layer="2425" from-port="0" to-layer="2426" to-port="1" /> <edge from-layer="2426" from-port="2" to-layer="2427" to-port="0" /> <edge from-layer="2427" from-port="1" to-layer="2428" to-port="1" /> <edge from-layer="2428" from-port="2" to-layer="2430" to-port="0" /> <edge from-layer="2429" from-port="0" to-layer="2430" to-port="1" /> <edge from-layer="2430" from-port="2" to-layer="2432" to-port="0" /> <edge from-layer="2431" from-port="0" to-layer="2432" to-port="1" /> <edge from-layer="2432" from-port="2" to-layer="2434" to-port="0" /> <edge from-layer="2433" from-port="0" to-layer="2434" to-port="1" /> <edge from-layer="2434" from-port="2" to-layer="2435" to-port="0" /> <edge from-layer="2435" from-port="3" to-layer="2437" to-port="0" /> <edge from-layer="2436" from-port="0" to-layer="2437" to-port="1" /> <edge from-layer="2437" from-port="2" to-layer="2439" to-port="0" /> <edge from-layer="2438" from-port="0" to-layer="2439" to-port="1" /> <edge from-layer="2439" from-port="2" to-layer="2450" to-port="0" /> <edge from-layer="2440" from-port="0" to-layer="2441" to-port="0" /> <edge from-layer="2441" from-port="1" to-layer="2444" to-port="0" /> <edge from-layer="2442" from-port="0" to-layer="2443" to-port="0" /> <edge from-layer="2443" from-port="1" to-layer="2444" to-port="1" /> <edge from-layer="2444" from-port="2" to-layer="2446" to-port="0" /> <edge from-layer="2445" from-port="0" to-layer="2446" to-port="1" /> <edge from-layer="2446" from-port="2" to-layer="2448" to-port="0" /> <edge from-layer="2447" from-port="0" to-layer="2448" to-port="1" /> <edge from-layer="2448" from-port="2" to-layer="2449" to-port="0" /> <edge from-layer="2449" from-port="1" to-layer="2450" to-port="1" /> <edge from-layer="2450" from-port="2" to-layer="2452" to-port="0" /> <edge from-layer="2451" from-port="0" to-layer="2452" to-port="1" /> <edge from-layer="2452" from-port="2" to-layer="2453" to-port="1" /> <edge from-layer="2453" from-port="2" to-layer="2455" to-port="0" /> <edge from-layer="2453" from-port="2" to-layer="2487" to-port="0" /> <edge from-layer="2454" from-port="0" to-layer="2455" to-port="1" /> <edge from-layer="2455" from-port="2" to-layer="2457" to-port="0" /> <edge from-layer="2456" from-port="0" to-layer="2457" to-port="1" /> <edge from-layer="2457" from-port="2" to-layer="2459" to-port="0" /> <edge from-layer="2458" from-port="0" to-layer="2459" to-port="1" /> <edge from-layer="2459" from-port="2" to-layer="2470" to-port="0" /> <edge from-layer="2460" from-port="0" to-layer="2461" to-port="0" /> <edge from-layer="2461" from-port="1" to-layer="2464" to-port="0" /> <edge from-layer="2462" from-port="0" to-layer="2463" to-port="0" /> <edge from-layer="2463" from-port="1" to-layer="2464" to-port="1" /> <edge from-layer="2464" from-port="2" to-layer="2466" to-port="0" /> <edge from-layer="2465" from-port="0" to-layer="2466" to-port="1" /> <edge from-layer="2466" from-port="2" to-layer="2468" to-port="0" /> <edge from-layer="2467" from-port="0" to-layer="2468" to-port="1" /> <edge from-layer="2468" from-port="2" to-layer="2469" to-port="0" /> <edge from-layer="2469" from-port="1" to-layer="2470" to-port="1" /> <edge from-layer="2470" from-port="2" to-layer="2472" to-port="0" /> <edge from-layer="2471" from-port="0" to-layer="2472" to-port="1" /> <edge from-layer="2472" from-port="2" to-layer="2473" to-port="0" /> <edge from-layer="2473" from-port="1" to-layer="2484" to-port="0" /> <edge from-layer="2474" from-port="0" to-layer="2475" to-port="0" /> <edge from-layer="2475" from-port="1" to-layer="2478" to-port="0" /> <edge from-layer="2476" from-port="0" to-layer="2477" to-port="0" /> <edge from-layer="2477" from-port="1" to-layer="2478" to-port="1" /> <edge from-layer="2478" from-port="2" to-layer="2480" to-port="0" /> <edge from-layer="2479" from-port="0" to-layer="2480" to-port="1" /> <edge from-layer="2480" from-port="2" to-layer="2482" to-port="0" /> <edge from-layer="2481" from-port="0" to-layer="2482" to-port="1" /> <edge from-layer="2482" from-port="2" to-layer="2483" to-port="0" /> <edge from-layer="2483" from-port="1" to-layer="2484" to-port="1" /> <edge from-layer="2484" from-port="2" to-layer="2486" to-port="0" /> <edge from-layer="2485" from-port="0" to-layer="2486" to-port="1" /> <edge from-layer="2486" from-port="2" to-layer="2487" to-port="1" /> <edge from-layer="2487" from-port="2" to-layer="2595" to-port="0" /> <edge from-layer="2487" from-port="2" to-layer="2489" to-port="0" /> <edge from-layer="2488" from-port="0" to-layer="2489" to-port="1" /> <edge from-layer="2489" from-port="2" to-layer="2491" to-port="0" /> <edge from-layer="2490" from-port="0" to-layer="2491" to-port="1" /> <edge from-layer="2491" from-port="2" to-layer="2493" to-port="0" /> <edge from-layer="2492" from-port="0" to-layer="2493" to-port="1" /> <edge from-layer="2493" from-port="2" to-layer="2570" to-port="0" /> <edge from-layer="2493" from-port="2" to-layer="2532" to-port="0" /> <edge from-layer="2493" from-port="2" to-layer="2504" to-port="0" /> <edge from-layer="2494" from-port="0" to-layer="2495" to-port="0" /> <edge from-layer="2495" from-port="1" to-layer="2498" to-port="0" /> <edge from-layer="2496" from-port="0" to-layer="2497" to-port="0" /> <edge from-layer="2497" from-port="1" to-layer="2498" to-port="1" /> <edge from-layer="2498" from-port="2" to-layer="2500" to-port="0" /> <edge from-layer="2499" from-port="0" to-layer="2500" to-port="1" /> <edge from-layer="2500" from-port="2" to-layer="2502" to-port="0" /> <edge from-layer="2501" from-port="0" to-layer="2502" to-port="1" /> <edge from-layer="2502" from-port="2" to-layer="2503" to-port="0" /> <edge from-layer="2503" from-port="1" to-layer="2504" to-port="1" /> <edge from-layer="2504" from-port="2" to-layer="2506" to-port="0" /> <edge from-layer="2505" from-port="0" to-layer="2506" to-port="1" /> <edge from-layer="2506" from-port="2" to-layer="2508" to-port="0" /> <edge from-layer="2507" from-port="0" to-layer="2508" to-port="1" /> <edge from-layer="2508" from-port="2" to-layer="2510" to-port="0" /> <edge from-layer="2509" from-port="0" to-layer="2510" to-port="1" /> <edge from-layer="2510" from-port="2" to-layer="2511" to-port="1" /> <edge from-layer="2511" from-port="2" to-layer="2512" to-port="0" /> <edge from-layer="2511" from-port="2" to-layer="2577" to-port="2" /> <edge from-layer="2513" from-port="0" to-layer="2518" to-port="0" /> <edge from-layer="2514" from-port="0" to-layer="2517" to-port="1" /> <edge from-layer="2515" from-port="0" to-layer="2517" to-port="2" /> <edge from-layer="2516" from-port="0" to-layer="2517" to-port="3" /> <edge from-layer="2517" from-port="4" to-layer="2518" to-port="1" /> <edge from-layer="2518" from-port="2" to-layer="2519" to-port="0" /> <edge from-layer="2519" from-port="1" to-layer="2521" to-port="0" /> <edge from-layer="2520" from-port="0" to-layer="2521" to-port="2" /> <edge from-layer="2521" from-port="3" to-layer="2537" to-port="0" /> <edge from-layer="2522" from-port="0" to-layer="2523" to-port="0" /> <edge from-layer="2523" from-port="1" to-layer="2526" to-port="0" /> <edge from-layer="2524" from-port="0" to-layer="2525" to-port="0" /> <edge from-layer="2525" from-port="1" to-layer="2526" to-port="1" /> <edge from-layer="2526" from-port="2" to-layer="2528" to-port="0" /> <edge from-layer="2527" from-port="0" to-layer="2528" to-port="1" /> <edge from-layer="2528" from-port="2" to-layer="2530" to-port="0" /> <edge from-layer="2529" from-port="0" to-layer="2530" to-port="1" /> <edge from-layer="2530" from-port="2" to-layer="2531" to-port="0" /> <edge from-layer="2531" from-port="1" to-layer="2532" to-port="1" /> <edge from-layer="2532" from-port="2" to-layer="2534" to-port="0" /> <edge from-layer="2533" from-port="0" to-layer="2534" to-port="1" /> <edge from-layer="2534" from-port="2" to-layer="2536" to-port="0" /> <edge from-layer="2535" from-port="0" to-layer="2536" to-port="1" /> <edge from-layer="2536" from-port="2" to-layer="2537" to-port="1" /> <edge from-layer="2537" from-port="2" to-layer="2538" to-port="0" /> <edge from-layer="2537" from-port="2" to-layer="2577" to-port="1" /> <edge from-layer="2551" from-port="0" to-layer="2556" to-port="0" /> <edge from-layer="2552" from-port="0" to-layer="2555" to-port="1" /> <edge from-layer="2553" from-port="0" to-layer="2555" to-port="2" /> <edge from-layer="2554" from-port="0" to-layer="2555" to-port="3" /> <edge from-layer="2555" from-port="4" to-layer="2556" to-port="1" /> <edge from-layer="2556" from-port="2" to-layer="2557" to-port="0" /> <edge from-layer="2557" from-port="1" to-layer="2559" to-port="0" /> <edge from-layer="2558" from-port="0" to-layer="2559" to-port="2" /> <edge from-layer="2559" from-port="3" to-layer="4905" to-port="0" /> <edge from-layer="2560" from-port="0" to-layer="2561" to-port="0" /> <edge from-layer="2561" from-port="1" to-layer="2564" to-port="0" /> <edge from-layer="2562" from-port="0" to-layer="2563" to-port="0" /> <edge from-layer="2563" from-port="1" to-layer="2564" to-port="1" /> <edge from-layer="2564" from-port="2" to-layer="2566" to-port="0" /> <edge from-layer="2565" from-port="0" to-layer="2566" to-port="1" /> <edge from-layer="2566" from-port="2" to-layer="2568" to-port="0" /> <edge from-layer="2567" from-port="0" to-layer="2568" to-port="1" /> <edge from-layer="2568" from-port="2" to-layer="2569" to-port="0" /> <edge from-layer="2569" from-port="1" to-layer="2570" to-port="1" /> <edge from-layer="2570" from-port="2" to-layer="2572" to-port="0" /> <edge from-layer="2571" from-port="0" to-layer="2572" to-port="1" /> <edge from-layer="2572" from-port="2" to-layer="2574" to-port="0" /> <edge from-layer="2573" from-port="0" to-layer="2574" to-port="1" /> <edge from-layer="2574" from-port="2" to-layer="2576" to-port="0" /> <edge from-layer="2575" from-port="0" to-layer="2576" to-port="1" /> <edge from-layer="2576" from-port="2" to-layer="2577" to-port="0" /> <edge from-layer="2577" from-port="4" to-layer="2579" to-port="0" /> <edge from-layer="2578" from-port="0" to-layer="2579" to-port="1" /> <edge from-layer="2579" from-port="2" to-layer="2581" to-port="0" /> <edge from-layer="2580" from-port="0" to-layer="2581" to-port="1" /> <edge from-layer="2581" from-port="2" to-layer="2592" to-port="0" /> <edge from-layer="2582" from-port="0" to-layer="2583" to-port="0" /> <edge from-layer="2583" from-port="1" to-layer="2586" to-port="0" /> <edge from-layer="2584" from-port="0" to-layer="2585" to-port="0" /> <edge from-layer="2585" from-port="1" to-layer="2586" to-port="1" /> <edge from-layer="2586" from-port="2" to-layer="2588" to-port="0" /> <edge from-layer="2587" from-port="0" to-layer="2588" to-port="1" /> <edge from-layer="2588" from-port="2" to-layer="2590" to-port="0" /> <edge from-layer="2589" from-port="0" to-layer="2590" to-port="1" /> <edge from-layer="2590" from-port="2" to-layer="2591" to-port="0" /> <edge from-layer="2591" from-port="1" to-layer="2592" to-port="1" /> <edge from-layer="2592" from-port="2" to-layer="2594" to-port="0" /> <edge from-layer="2593" from-port="0" to-layer="2594" to-port="1" /> <edge from-layer="2594" from-port="2" to-layer="2595" to-port="1" /> <edge from-layer="2595" from-port="2" to-layer="2597" to-port="0" /> <edge from-layer="2595" from-port="2" to-layer="2637" to-port="0" /> <edge from-layer="2596" from-port="0" to-layer="2597" to-port="1" /> <edge from-layer="2597" from-port="2" to-layer="2599" to-port="0" /> <edge from-layer="2598" from-port="0" to-layer="2599" to-port="1" /> <edge from-layer="2599" from-port="2" to-layer="2601" to-port="0" /> <edge from-layer="2600" from-port="0" to-layer="2601" to-port="1" /> <edge from-layer="2601" from-port="2" to-layer="2612" to-port="0" /> <edge from-layer="2602" from-port="0" to-layer="2603" to-port="0" /> <edge from-layer="2603" from-port="1" to-layer="2606" to-port="0" /> <edge from-layer="2604" from-port="0" to-layer="2605" to-port="0" /> <edge from-layer="2605" from-port="1" to-layer="2606" to-port="1" /> <edge from-layer="2606" from-port="2" to-layer="2608" to-port="0" /> <edge from-layer="2607" from-port="0" to-layer="2608" to-port="1" /> <edge from-layer="2608" from-port="2" to-layer="2610" to-port="0" /> <edge from-layer="2609" from-port="0" to-layer="2610" to-port="1" /> <edge from-layer="2610" from-port="2" to-layer="2611" to-port="0" /> <edge from-layer="2611" from-port="1" to-layer="2612" to-port="1" /> <edge from-layer="2612" from-port="2" to-layer="2614" to-port="0" /> <edge from-layer="2613" from-port="0" to-layer="2614" to-port="1" /> <edge from-layer="2614" from-port="2" to-layer="2616" to-port="0" /> <edge from-layer="2615" from-port="0" to-layer="2616" to-port="1" /> <edge from-layer="2616" from-port="2" to-layer="2618" to-port="0" /> <edge from-layer="2617" from-port="0" to-layer="2618" to-port="1" /> <edge from-layer="2618" from-port="2" to-layer="2619" to-port="0" /> <edge from-layer="2619" from-port="3" to-layer="2621" to-port="0" /> <edge from-layer="2620" from-port="0" to-layer="2621" to-port="1" /> <edge from-layer="2621" from-port="2" to-layer="2623" to-port="0" /> <edge from-layer="2622" from-port="0" to-layer="2623" to-port="1" /> <edge from-layer="2623" from-port="2" to-layer="2634" to-port="0" /> <edge from-layer="2624" from-port="0" to-layer="2625" to-port="0" /> <edge from-layer="2625" from-port="1" to-layer="2628" to-port="0" /> <edge from-layer="2626" from-port="0" to-layer="2627" to-port="0" /> <edge from-layer="2627" from-port="1" to-layer="2628" to-port="1" /> <edge from-layer="2628" from-port="2" to-layer="2630" to-port="0" /> <edge from-layer="2629" from-port="0" to-layer="2630" to-port="1" /> <edge from-layer="2630" from-port="2" to-layer="2632" to-port="0" /> <edge from-layer="2631" from-port="0" to-layer="2632" to-port="1" /> <edge from-layer="2632" from-port="2" to-layer="2633" to-port="0" /> <edge from-layer="2633" from-port="1" to-layer="2634" to-port="1" /> <edge from-layer="2634" from-port="2" to-layer="2636" to-port="0" /> <edge from-layer="2635" from-port="0" to-layer="2636" to-port="1" /> <edge from-layer="2636" from-port="2" to-layer="2637" to-port="1" /> <edge from-layer="2637" from-port="2" to-layer="2639" to-port="0" /> <edge from-layer="2637" from-port="2" to-layer="2671" to-port="0" /> <edge from-layer="2638" from-port="0" to-layer="2639" to-port="1" /> <edge from-layer="2639" from-port="2" to-layer="2641" to-port="0" /> <edge from-layer="2640" from-port="0" to-layer="2641" to-port="1" /> <edge from-layer="2641" from-port="2" to-layer="2643" to-port="0" /> <edge from-layer="2642" from-port="0" to-layer="2643" to-port="1" /> <edge from-layer="2643" from-port="2" to-layer="2654" to-port="0" /> <edge from-layer="2644" from-port="0" to-layer="2645" to-port="0" /> <edge from-layer="2645" from-port="1" to-layer="2648" to-port="0" /> <edge from-layer="2646" from-port="0" to-layer="2647" to-port="0" /> <edge from-layer="2647" from-port="1" to-layer="2648" to-port="1" /> <edge from-layer="2648" from-port="2" to-layer="2650" to-port="0" /> <edge from-layer="2649" from-port="0" to-layer="2650" to-port="1" /> <edge from-layer="2650" from-port="2" to-layer="2652" to-port="0" /> <edge from-layer="2651" from-port="0" to-layer="2652" to-port="1" /> <edge from-layer="2652" from-port="2" to-layer="2653" to-port="0" /> <edge from-layer="2653" from-port="1" to-layer="2654" to-port="1" /> <edge from-layer="2654" from-port="2" to-layer="2656" to-port="0" /> <edge from-layer="2655" from-port="0" to-layer="2656" to-port="1" /> <edge from-layer="2656" from-port="2" to-layer="2657" to-port="0" /> <edge from-layer="2657" from-port="1" to-layer="2668" to-port="0" /> <edge from-layer="2658" from-port="0" to-layer="2659" to-port="0" /> <edge from-layer="2659" from-port="1" to-layer="2662" to-port="0" /> <edge from-layer="2660" from-port="0" to-layer="2661" to-port="0" /> <edge from-layer="2661" from-port="1" to-layer="2662" to-port="1" /> <edge from-layer="2662" from-port="2" to-layer="2664" to-port="0" /> <edge from-layer="2663" from-port="0" to-layer="2664" to-port="1" /> <edge from-layer="2664" from-port="2" to-layer="2666" to-port="0" /> <edge from-layer="2665" from-port="0" to-layer="2666" to-port="1" /> <edge from-layer="2666" from-port="2" to-layer="2667" to-port="0" /> <edge from-layer="2667" from-port="1" to-layer="2668" to-port="1" /> <edge from-layer="2668" from-port="2" to-layer="2670" to-port="0" /> <edge from-layer="2669" from-port="0" to-layer="2670" to-port="1" /> <edge from-layer="2670" from-port="2" to-layer="2671" to-port="1" /> <edge from-layer="2671" from-port="2" to-layer="2765" to-port="0" /> <edge from-layer="2671" from-port="2" to-layer="2673" to-port="0" /> <edge from-layer="2672" from-port="0" to-layer="2673" to-port="1" /> <edge from-layer="2673" from-port="2" to-layer="2675" to-port="0" /> <edge from-layer="2674" from-port="0" to-layer="2675" to-port="1" /> <edge from-layer="2675" from-port="2" to-layer="2677" to-port="0" /> <edge from-layer="2676" from-port="0" to-layer="2677" to-port="1" /> <edge from-layer="2677" from-port="2" to-layer="2714" to-port="0" /> <edge from-layer="2677" from-port="2" to-layer="2739" to-port="0" /> <edge from-layer="2677" from-port="2" to-layer="2688" to-port="0" /> <edge from-layer="2678" from-port="0" to-layer="2679" to-port="0" /> <edge from-layer="2679" from-port="1" to-layer="2682" to-port="0" /> <edge from-layer="2680" from-port="0" to-layer="2681" to-port="0" /> <edge from-layer="2681" from-port="1" to-layer="2682" to-port="1" /> <edge from-layer="2682" from-port="2" to-layer="2684" to-port="0" /> <edge from-layer="2683" from-port="0" to-layer="2684" to-port="1" /> <edge from-layer="2684" from-port="2" to-layer="2686" to-port="0" /> <edge from-layer="2685" from-port="0" to-layer="2686" to-port="1" /> <edge from-layer="2686" from-port="2" to-layer="2687" to-port="0" /> <edge from-layer="2687" from-port="1" to-layer="2688" to-port="1" /> <edge from-layer="2688" from-port="2" to-layer="2690" to-port="0" /> <edge from-layer="2689" from-port="0" to-layer="2690" to-port="1" /> <edge from-layer="2690" from-port="2" to-layer="2692" to-port="0" /> <edge from-layer="2691" from-port="0" to-layer="2692" to-port="1" /> <edge from-layer="2692" from-port="2" to-layer="2694" to-port="0" /> <edge from-layer="2693" from-port="0" to-layer="2694" to-port="1" /> <edge from-layer="2694" from-port="2" to-layer="2747" to-port="0" /> <edge from-layer="2695" from-port="0" to-layer="2700" to-port="0" /> <edge from-layer="2696" from-port="0" to-layer="2699" to-port="1" /> <edge from-layer="2697" from-port="0" to-layer="2699" to-port="2" /> <edge from-layer="2698" from-port="0" to-layer="2699" to-port="3" /> <edge from-layer="2699" from-port="4" to-layer="2700" to-port="1" /> <edge from-layer="2700" from-port="2" to-layer="2701" to-port="0" /> <edge from-layer="2701" from-port="1" to-layer="2703" to-port="0" /> <edge from-layer="2702" from-port="0" to-layer="2703" to-port="2" /> <edge from-layer="2703" from-port="3" to-layer="2719" to-port="0" /> <edge from-layer="2704" from-port="0" to-layer="2705" to-port="0" /> <edge from-layer="2705" from-port="1" to-layer="2708" to-port="0" /> <edge from-layer="2706" from-port="0" to-layer="2707" to-port="0" /> <edge from-layer="2707" from-port="1" to-layer="2708" to-port="1" /> <edge from-layer="2708" from-port="2" to-layer="2710" to-port="0" /> <edge from-layer="2709" from-port="0" to-layer="2710" to-port="1" /> <edge from-layer="2710" from-port="2" to-layer="2712" to-port="0" /> <edge from-layer="2711" from-port="0" to-layer="2712" to-port="1" /> <edge from-layer="2712" from-port="2" to-layer="2713" to-port="0" /> <edge from-layer="2713" from-port="1" to-layer="2714" to-port="1" /> <edge from-layer="2714" from-port="2" to-layer="2716" to-port="0" /> <edge from-layer="2715" from-port="0" to-layer="2716" to-port="1" /> <edge from-layer="2716" from-port="2" to-layer="2718" to-port="0" /> <edge from-layer="2717" from-port="0" to-layer="2718" to-port="1" /> <edge from-layer="2718" from-port="2" to-layer="2719" to-port="1" /> <edge from-layer="2719" from-port="2" to-layer="4960" to-port="0" /> <edge from-layer="2719" from-port="2" to-layer="2747" to-port="1" /> <edge from-layer="2720" from-port="0" to-layer="2725" to-port="0" /> <edge from-layer="2721" from-port="0" to-layer="2724" to-port="1" /> <edge from-layer="2722" from-port="0" to-layer="2724" to-port="2" /> <edge from-layer="2723" from-port="0" to-layer="2724" to-port="3" /> <edge from-layer="2724" from-port="4" to-layer="2725" to-port="1" /> <edge from-layer="2725" from-port="2" to-layer="2726" to-port="0" /> <edge from-layer="2726" from-port="1" to-layer="2728" to-port="0" /> <edge from-layer="2727" from-port="0" to-layer="2728" to-port="2" /> <edge from-layer="2728" from-port="3" to-layer="2746" to-port="0" /> <edge from-layer="2729" from-port="0" to-layer="2730" to-port="0" /> <edge from-layer="2730" from-port="1" to-layer="2733" to-port="0" /> <edge from-layer="2731" from-port="0" to-layer="2732" to-port="0" /> <edge from-layer="2732" from-port="1" to-layer="2733" to-port="1" /> <edge from-layer="2733" from-port="2" to-layer="2735" to-port="0" /> <edge from-layer="2734" from-port="0" to-layer="2735" to-port="1" /> <edge from-layer="2735" from-port="2" to-layer="2737" to-port="0" /> <edge from-layer="2736" from-port="0" to-layer="2737" to-port="1" /> <edge from-layer="2737" from-port="2" to-layer="2738" to-port="0" /> <edge from-layer="2738" from-port="1" to-layer="2739" to-port="1" /> <edge from-layer="2739" from-port="2" to-layer="2741" to-port="0" /> <edge from-layer="2740" from-port="0" to-layer="2741" to-port="1" /> <edge from-layer="2741" from-port="2" to-layer="2743" to-port="0" /> <edge from-layer="2742" from-port="0" to-layer="2743" to-port="1" /> <edge from-layer="2743" from-port="2" to-layer="2745" to-port="0" /> <edge from-layer="2744" from-port="0" to-layer="2745" to-port="1" /> <edge from-layer="2745" from-port="2" to-layer="2746" to-port="1" /> <edge from-layer="2746" from-port="2" to-layer="2747" to-port="2" /> <edge from-layer="2746" from-port="2" to-layer="4959" to-port="0" /> <edge from-layer="2747" from-port="4" to-layer="2749" to-port="0" /> <edge from-layer="2748" from-port="0" to-layer="2749" to-port="1" /> <edge from-layer="2749" from-port="2" to-layer="2751" to-port="0" /> <edge from-layer="2750" from-port="0" to-layer="2751" to-port="1" /> <edge from-layer="2751" from-port="2" to-layer="2762" to-port="0" /> <edge from-layer="2752" from-port="0" to-layer="2753" to-port="0" /> <edge from-layer="2753" from-port="1" to-layer="2756" to-port="0" /> <edge from-layer="2754" from-port="0" to-layer="2755" to-port="0" /> <edge from-layer="2755" from-port="1" to-layer="2756" to-port="1" /> <edge from-layer="2756" from-port="2" to-layer="2758" to-port="0" /> <edge from-layer="2757" from-port="0" to-layer="2758" to-port="1" /> <edge from-layer="2758" from-port="2" to-layer="2760" to-port="0" /> <edge from-layer="2759" from-port="0" to-layer="2760" to-port="1" /> <edge from-layer="2760" from-port="2" to-layer="2761" to-port="0" /> <edge from-layer="2761" from-port="1" to-layer="2762" to-port="1" /> <edge from-layer="2762" from-port="2" to-layer="2764" to-port="0" /> <edge from-layer="2763" from-port="0" to-layer="2764" to-port="1" /> <edge from-layer="2764" from-port="2" to-layer="2765" to-port="1" /> <edge from-layer="2765" from-port="2" to-layer="2807" to-port="0" /> <edge from-layer="2765" from-port="2" to-layer="2767" to-port="0" /> <edge from-layer="2766" from-port="0" to-layer="2767" to-port="1" /> <edge from-layer="2767" from-port="2" to-layer="2769" to-port="0" /> <edge from-layer="2768" from-port="0" to-layer="2769" to-port="1" /> <edge from-layer="2769" from-port="2" to-layer="2771" to-port="0" /> <edge from-layer="2770" from-port="0" to-layer="2771" to-port="1" /> <edge from-layer="2771" from-port="2" to-layer="2782" to-port="0" /> <edge from-layer="2772" from-port="0" to-layer="2773" to-port="0" /> <edge from-layer="2773" from-port="1" to-layer="2776" to-port="0" /> <edge from-layer="2774" from-port="0" to-layer="2775" to-port="0" /> <edge from-layer="2775" from-port="1" to-layer="2776" to-port="1" /> <edge from-layer="2776" from-port="2" to-layer="2778" to-port="0" /> <edge from-layer="2777" from-port="0" to-layer="2778" to-port="1" /> <edge from-layer="2778" from-port="2" to-layer="2780" to-port="0" /> <edge from-layer="2779" from-port="0" to-layer="2780" to-port="1" /> <edge from-layer="2780" from-port="2" to-layer="2781" to-port="0" /> <edge from-layer="2781" from-port="1" to-layer="2782" to-port="1" /> <edge from-layer="2782" from-port="2" to-layer="2784" to-port="0" /> <edge from-layer="2783" from-port="0" to-layer="2784" to-port="1" /> <edge from-layer="2784" from-port="2" to-layer="2786" to-port="0" /> <edge from-layer="2785" from-port="0" to-layer="2786" to-port="1" /> <edge from-layer="2786" from-port="2" to-layer="2788" to-port="0" /> <edge from-layer="2787" from-port="0" to-layer="2788" to-port="1" /> <edge from-layer="2788" from-port="2" to-layer="2789" to-port="0" /> <edge from-layer="2789" from-port="3" to-layer="2791" to-port="0" /> <edge from-layer="2790" from-port="0" to-layer="2791" to-port="1" /> <edge from-layer="2791" from-port="2" to-layer="2793" to-port="0" /> <edge from-layer="2792" from-port="0" to-layer="2793" to-port="1" /> <edge from-layer="2793" from-port="2" to-layer="2804" to-port="0" /> <edge from-layer="2794" from-port="0" to-layer="2795" to-port="0" /> <edge from-layer="2795" from-port="1" to-layer="2798" to-port="0" /> <edge from-layer="2796" from-port="0" to-layer="2797" to-port="0" /> <edge from-layer="2797" from-port="1" to-layer="2798" to-port="1" /> <edge from-layer="2798" from-port="2" to-layer="2800" to-port="0" /> <edge from-layer="2799" from-port="0" to-layer="2800" to-port="1" /> <edge from-layer="2800" from-port="2" to-layer="2802" to-port="0" /> <edge from-layer="2801" from-port="0" to-layer="2802" to-port="1" /> <edge from-layer="2802" from-port="2" to-layer="2803" to-port="0" /> <edge from-layer="2803" from-port="1" to-layer="2804" to-port="1" /> <edge from-layer="2804" from-port="2" to-layer="2806" to-port="0" /> <edge from-layer="2805" from-port="0" to-layer="2806" to-port="1" /> <edge from-layer="2806" from-port="2" to-layer="2807" to-port="1" /> <edge from-layer="2807" from-port="2" to-layer="2809" to-port="0" /> <edge from-layer="2807" from-port="2" to-layer="2841" to-port="0" /> <edge from-layer="2808" from-port="0" to-layer="2809" to-port="1" /> <edge from-layer="2809" from-port="2" to-layer="2811" to-port="0" /> <edge from-layer="2810" from-port="0" to-layer="2811" to-port="1" /> <edge from-layer="2811" from-port="2" to-layer="2813" to-port="0" /> <edge from-layer="2812" from-port="0" to-layer="2813" to-port="1" /> <edge from-layer="2813" from-port="2" to-layer="2824" to-port="0" /> <edge from-layer="2814" from-port="0" to-layer="2815" to-port="0" /> <edge from-layer="2815" from-port="1" to-layer="2818" to-port="0" /> <edge from-layer="2816" from-port="0" to-layer="2817" to-port="0" /> <edge from-layer="2817" from-port="1" to-layer="2818" to-port="1" /> <edge from-layer="2818" from-port="2" to-layer="2820" to-port="0" /> <edge from-layer="2819" from-port="0" to-layer="2820" to-port="1" /> <edge from-layer="2820" from-port="2" to-layer="2822" to-port="0" /> <edge from-layer="2821" from-port="0" to-layer="2822" to-port="1" /> <edge from-layer="2822" from-port="2" to-layer="2823" to-port="0" /> <edge from-layer="2823" from-port="1" to-layer="2824" to-port="1" /> <edge from-layer="2824" from-port="2" to-layer="2826" to-port="0" /> <edge from-layer="2825" from-port="0" to-layer="2826" to-port="1" /> <edge from-layer="2826" from-port="2" to-layer="2827" to-port="0" /> <edge from-layer="2827" from-port="1" to-layer="2838" to-port="0" /> <edge from-layer="2828" from-port="0" to-layer="2829" to-port="0" /> <edge from-layer="2829" from-port="1" to-layer="2832" to-port="0" /> <edge from-layer="2830" from-port="0" to-layer="2831" to-port="0" /> <edge from-layer="2831" from-port="1" to-layer="2832" to-port="1" /> <edge from-layer="2832" from-port="2" to-layer="2834" to-port="0" /> <edge from-layer="2833" from-port="0" to-layer="2834" to-port="1" /> <edge from-layer="2834" from-port="2" to-layer="2836" to-port="0" /> <edge from-layer="2835" from-port="0" to-layer="2836" to-port="1" /> <edge from-layer="2836" from-port="2" to-layer="2837" to-port="0" /> <edge from-layer="2837" from-port="1" to-layer="2838" to-port="1" /> <edge from-layer="2838" from-port="2" to-layer="2840" to-port="0" /> <edge from-layer="2839" from-port="0" to-layer="2840" to-port="1" /> <edge from-layer="2840" from-port="2" to-layer="2841" to-port="1" /> <edge from-layer="2841" from-port="2" to-layer="2843" to-port="0" /> <edge from-layer="2841" from-port="2" to-layer="2935" to-port="0" /> <edge from-layer="2842" from-port="0" to-layer="2843" to-port="1" /> <edge from-layer="2843" from-port="2" to-layer="2845" to-port="0" /> <edge from-layer="2844" from-port="0" to-layer="2845" to-port="1" /> <edge from-layer="2845" from-port="2" to-layer="2847" to-port="0" /> <edge from-layer="2846" from-port="0" to-layer="2847" to-port="1" /> <edge from-layer="2847" from-port="2" to-layer="2858" to-port="0" /> <edge from-layer="2847" from-port="2" to-layer="2909" to-port="0" /> <edge from-layer="2847" from-port="2" to-layer="2884" to-port="0" /> <edge from-layer="2848" from-port="0" to-layer="2849" to-port="0" /> <edge from-layer="2849" from-port="1" to-layer="2852" to-port="0" /> <edge from-layer="2850" from-port="0" to-layer="2851" to-port="0" /> <edge from-layer="2851" from-port="1" to-layer="2852" to-port="1" /> <edge from-layer="2852" from-port="2" to-layer="2854" to-port="0" /> <edge from-layer="2853" from-port="0" to-layer="2854" to-port="1" /> <edge from-layer="2854" from-port="2" to-layer="2856" to-port="0" /> <edge from-layer="2855" from-port="0" to-layer="2856" to-port="1" /> <edge from-layer="2856" from-port="2" to-layer="2857" to-port="0" /> <edge from-layer="2857" from-port="1" to-layer="2858" to-port="1" /> <edge from-layer="2858" from-port="2" to-layer="2860" to-port="0" /> <edge from-layer="2859" from-port="0" to-layer="2860" to-port="1" /> <edge from-layer="2860" from-port="2" to-layer="2862" to-port="0" /> <edge from-layer="2861" from-port="0" to-layer="2862" to-port="1" /> <edge from-layer="2862" from-port="2" to-layer="2864" to-port="0" /> <edge from-layer="2863" from-port="0" to-layer="2864" to-port="1" /> <edge from-layer="2864" from-port="2" to-layer="2917" to-port="0" /> <edge from-layer="2865" from-port="0" to-layer="2870" to-port="0" /> <edge from-layer="2866" from-port="0" to-layer="2869" to-port="1" /> <edge from-layer="2867" from-port="0" to-layer="2869" to-port="2" /> <edge from-layer="2868" from-port="0" to-layer="2869" to-port="3" /> <edge from-layer="2869" from-port="4" to-layer="2870" to-port="1" /> <edge from-layer="2870" from-port="2" to-layer="2871" to-port="0" /> <edge from-layer="2871" from-port="1" to-layer="2873" to-port="0" /> <edge from-layer="2872" from-port="0" to-layer="2873" to-port="2" /> <edge from-layer="2873" from-port="3" to-layer="2889" to-port="0" /> <edge from-layer="2874" from-port="0" to-layer="2875" to-port="0" /> <edge from-layer="2875" from-port="1" to-layer="2878" to-port="0" /> <edge from-layer="2876" from-port="0" to-layer="2877" to-port="0" /> <edge from-layer="2877" from-port="1" to-layer="2878" to-port="1" /> <edge from-layer="2878" from-port="2" to-layer="2880" to-port="0" /> <edge from-layer="2879" from-port="0" to-layer="2880" to-port="1" /> <edge from-layer="2880" from-port="2" to-layer="2882" to-port="0" /> <edge from-layer="2881" from-port="0" to-layer="2882" to-port="1" /> <edge from-layer="2882" from-port="2" to-layer="2883" to-port="0" /> <edge from-layer="2883" from-port="1" to-layer="2884" to-port="1" /> <edge from-layer="2884" from-port="2" to-layer="2886" to-port="0" /> <edge from-layer="2885" from-port="0" to-layer="2886" to-port="1" /> <edge from-layer="2886" from-port="2" to-layer="2888" to-port="0" /> <edge from-layer="2887" from-port="0" to-layer="2888" to-port="1" /> <edge from-layer="2888" from-port="2" to-layer="2889" to-port="1" /> <edge from-layer="2889" from-port="2" to-layer="4958" to-port="0" /> <edge from-layer="2889" from-port="2" to-layer="2917" to-port="1" /> <edge from-layer="2890" from-port="0" to-layer="2895" to-port="0" /> <edge from-layer="2891" from-port="0" to-layer="2894" to-port="1" /> <edge from-layer="2892" from-port="0" to-layer="2894" to-port="2" /> <edge from-layer="2893" from-port="0" to-layer="2894" to-port="3" /> <edge from-layer="2894" from-port="4" to-layer="2895" to-port="1" /> <edge from-layer="2895" from-port="2" to-layer="2896" to-port="0" /> <edge from-layer="2896" from-port="1" to-layer="2898" to-port="0" /> <edge from-layer="2897" from-port="0" to-layer="2898" to-port="2" /> <edge from-layer="2898" from-port="3" to-layer="2916" to-port="0" /> <edge from-layer="2899" from-port="0" to-layer="2900" to-port="0" /> <edge from-layer="2900" from-port="1" to-layer="2903" to-port="0" /> <edge from-layer="2901" from-port="0" to-layer="2902" to-port="0" /> <edge from-layer="2902" from-port="1" to-layer="2903" to-port="1" /> <edge from-layer="2903" from-port="2" to-layer="2905" to-port="0" /> <edge from-layer="2904" from-port="0" to-layer="2905" to-port="1" /> <edge from-layer="2905" from-port="2" to-layer="2907" to-port="0" /> <edge from-layer="2906" from-port="0" to-layer="2907" to-port="1" /> <edge from-layer="2907" from-port="2" to-layer="2908" to-port="0" /> <edge from-layer="2908" from-port="1" to-layer="2909" to-port="1" /> <edge from-layer="2909" from-port="2" to-layer="2911" to-port="0" /> <edge from-layer="2910" from-port="0" to-layer="2911" to-port="1" /> <edge from-layer="2911" from-port="2" to-layer="2913" to-port="0" /> <edge from-layer="2912" from-port="0" to-layer="2913" to-port="1" /> <edge from-layer="2913" from-port="2" to-layer="2915" to-port="0" /> <edge from-layer="2914" from-port="0" to-layer="2915" to-port="1" /> <edge from-layer="2915" from-port="2" to-layer="2916" to-port="1" /> <edge from-layer="2916" from-port="2" to-layer="2917" to-port="2" /> <edge from-layer="2916" from-port="2" to-layer="4957" to-port="0" /> <edge from-layer="2917" from-port="4" to-layer="2919" to-port="0" /> <edge from-layer="2918" from-port="0" to-layer="2919" to-port="1" /> <edge from-layer="2919" from-port="2" to-layer="2921" to-port="0" /> <edge from-layer="2920" from-port="0" to-layer="2921" to-port="1" /> <edge from-layer="2921" from-port="2" to-layer="2932" to-port="0" /> <edge from-layer="2922" from-port="0" to-layer="2923" to-port="0" /> <edge from-layer="2923" from-port="1" to-layer="2926" to-port="0" /> <edge from-layer="2924" from-port="0" to-layer="2925" to-port="0" /> <edge from-layer="2925" from-port="1" to-layer="2926" to-port="1" /> <edge from-layer="2926" from-port="2" to-layer="2928" to-port="0" /> <edge from-layer="2927" from-port="0" to-layer="2928" to-port="1" /> <edge from-layer="2928" from-port="2" to-layer="2930" to-port="0" /> <edge from-layer="2929" from-port="0" to-layer="2930" to-port="1" /> <edge from-layer="2930" from-port="2" to-layer="2931" to-port="0" /> <edge from-layer="2931" from-port="1" to-layer="2932" to-port="1" /> <edge from-layer="2932" from-port="2" to-layer="2934" to-port="0" /> <edge from-layer="2933" from-port="0" to-layer="2934" to-port="1" /> <edge from-layer="2934" from-port="2" to-layer="2935" to-port="1" /> <edge from-layer="2935" from-port="2" to-layer="2937" to-port="0" /> <edge from-layer="2935" from-port="2" to-layer="2977" to-port="0" /> <edge from-layer="2936" from-port="0" to-layer="2937" to-port="1" /> <edge from-layer="2937" from-port="2" to-layer="2939" to-port="0" /> <edge from-layer="2938" from-port="0" to-layer="2939" to-port="1" /> <edge from-layer="2939" from-port="2" to-layer="2941" to-port="0" /> <edge from-layer="2940" from-port="0" to-layer="2941" to-port="1" /> <edge from-layer="2941" from-port="2" to-layer="2952" to-port="0" /> <edge from-layer="2942" from-port="0" to-layer="2943" to-port="0" /> <edge from-layer="2943" from-port="1" to-layer="2946" to-port="0" /> <edge from-layer="2944" from-port="0" to-layer="2945" to-port="0" /> <edge from-layer="2945" from-port="1" to-layer="2946" to-port="1" /> <edge from-layer="2946" from-port="2" to-layer="2948" to-port="0" /> <edge from-layer="2947" from-port="0" to-layer="2948" to-port="1" /> <edge from-layer="2948" from-port="2" to-layer="2950" to-port="0" /> <edge from-layer="2949" from-port="0" to-layer="2950" to-port="1" /> <edge from-layer="2950" from-port="2" to-layer="2951" to-port="0" /> <edge from-layer="2951" from-port="1" to-layer="2952" to-port="1" /> <edge from-layer="2952" from-port="2" to-layer="2954" to-port="0" /> <edge from-layer="2953" from-port="0" to-layer="2954" to-port="1" /> <edge from-layer="2954" from-port="2" to-layer="2956" to-port="0" /> <edge from-layer="2955" from-port="0" to-layer="2956" to-port="1" /> <edge from-layer="2956" from-port="2" to-layer="2958" to-port="0" /> <edge from-layer="2957" from-port="0" to-layer="2958" to-port="1" /> <edge from-layer="2958" from-port="2" to-layer="2959" to-port="0" /> <edge from-layer="2959" from-port="3" to-layer="2961" to-port="0" /> <edge from-layer="2960" from-port="0" to-layer="2961" to-port="1" /> <edge from-layer="2961" from-port="2" to-layer="2963" to-port="0" /> <edge from-layer="2962" from-port="0" to-layer="2963" to-port="1" /> <edge from-layer="2963" from-port="2" to-layer="2974" to-port="0" /> <edge from-layer="2964" from-port="0" to-layer="2965" to-port="0" /> <edge from-layer="2965" from-port="1" to-layer="2968" to-port="0" /> <edge from-layer="2966" from-port="0" to-layer="2967" to-port="0" /> <edge from-layer="2967" from-port="1" to-layer="2968" to-port="1" /> <edge from-layer="2968" from-port="2" to-layer="2970" to-port="0" /> <edge from-layer="2969" from-port="0" to-layer="2970" to-port="1" /> <edge from-layer="2970" from-port="2" to-layer="2972" to-port="0" /> <edge from-layer="2971" from-port="0" to-layer="2972" to-port="1" /> <edge from-layer="2972" from-port="2" to-layer="2973" to-port="0" /> <edge from-layer="2973" from-port="1" to-layer="2974" to-port="1" /> <edge from-layer="2974" from-port="2" to-layer="2976" to-port="0" /> <edge from-layer="2975" from-port="0" to-layer="2976" to-port="1" /> <edge from-layer="2976" from-port="2" to-layer="2977" to-port="1" /> <edge from-layer="2977" from-port="2" to-layer="2979" to-port="0" /> <edge from-layer="2977" from-port="2" to-layer="3011" to-port="0" /> <edge from-layer="2978" from-port="0" to-layer="2979" to-port="1" /> <edge from-layer="2979" from-port="2" to-layer="2981" to-port="0" /> <edge from-layer="2980" from-port="0" to-layer="2981" to-port="1" /> <edge from-layer="2981" from-port="2" to-layer="2983" to-port="0" /> <edge from-layer="2982" from-port="0" to-layer="2983" to-port="1" /> <edge from-layer="2983" from-port="2" to-layer="2994" to-port="0" /> <edge from-layer="2984" from-port="0" to-layer="2985" to-port="0" /> <edge from-layer="2985" from-port="1" to-layer="2988" to-port="0" /> <edge from-layer="2986" from-port="0" to-layer="2987" to-port="0" /> <edge from-layer="2987" from-port="1" to-layer="2988" to-port="1" /> <edge from-layer="2988" from-port="2" to-layer="2990" to-port="0" /> <edge from-layer="2989" from-port="0" to-layer="2990" to-port="1" /> <edge from-layer="2990" from-port="2" to-layer="2992" to-port="0" /> <edge from-layer="2991" from-port="0" to-layer="2992" to-port="1" /> <edge from-layer="2992" from-port="2" to-layer="2993" to-port="0" /> <edge from-layer="2993" from-port="1" to-layer="2994" to-port="1" /> <edge from-layer="2994" from-port="2" to-layer="2996" to-port="0" /> <edge from-layer="2995" from-port="0" to-layer="2996" to-port="1" /> <edge from-layer="2996" from-port="2" to-layer="2997" to-port="0" /> <edge from-layer="2997" from-port="1" to-layer="3008" to-port="0" /> <edge from-layer="2998" from-port="0" to-layer="2999" to-port="0" /> <edge from-layer="2999" from-port="1" to-layer="3002" to-port="0" /> <edge from-layer="3000" from-port="0" to-layer="3001" to-port="0" /> <edge from-layer="3001" from-port="1" to-layer="3002" to-port="1" /> <edge from-layer="3002" from-port="2" to-layer="3004" to-port="0" /> <edge from-layer="3003" from-port="0" to-layer="3004" to-port="1" /> <edge from-layer="3004" from-port="2" to-layer="3006" to-port="0" /> <edge from-layer="3005" from-port="0" to-layer="3006" to-port="1" /> <edge from-layer="3006" from-port="2" to-layer="3007" to-port="0" /> <edge from-layer="3007" from-port="1" to-layer="3008" to-port="1" /> <edge from-layer="3008" from-port="2" to-layer="3010" to-port="0" /> <edge from-layer="3009" from-port="0" to-layer="3010" to-port="1" /> <edge from-layer="3010" from-port="2" to-layer="3011" to-port="1" /> <edge from-layer="3011" from-port="2" to-layer="3013" to-port="0" /> <edge from-layer="3011" from-port="2" to-layer="3105" to-port="0" /> <edge from-layer="3012" from-port="0" to-layer="3013" to-port="1" /> <edge from-layer="3013" from-port="2" to-layer="3015" to-port="0" /> <edge from-layer="3014" from-port="0" to-layer="3015" to-port="1" /> <edge from-layer="3015" from-port="2" to-layer="3017" to-port="0" /> <edge from-layer="3016" from-port="0" to-layer="3017" to-port="1" /> <edge from-layer="3017" from-port="2" to-layer="3028" to-port="0" /> <edge from-layer="3017" from-port="2" to-layer="3079" to-port="0" /> <edge from-layer="3017" from-port="2" to-layer="3054" to-port="0" /> <edge from-layer="3018" from-port="0" to-layer="3019" to-port="0" /> <edge from-layer="3019" from-port="1" to-layer="3022" to-port="0" /> <edge from-layer="3020" from-port="0" to-layer="3021" to-port="0" /> <edge from-layer="3021" from-port="1" to-layer="3022" to-port="1" /> <edge from-layer="3022" from-port="2" to-layer="3024" to-port="0" /> <edge from-layer="3023" from-port="0" to-layer="3024" to-port="1" /> <edge from-layer="3024" from-port="2" to-layer="3026" to-port="0" /> <edge from-layer="3025" from-port="0" to-layer="3026" to-port="1" /> <edge from-layer="3026" from-port="2" to-layer="3027" to-port="0" /> <edge from-layer="3027" from-port="1" to-layer="3028" to-port="1" /> <edge from-layer="3028" from-port="2" to-layer="3030" to-port="0" /> <edge from-layer="3029" from-port="0" to-layer="3030" to-port="1" /> <edge from-layer="3030" from-port="2" to-layer="3032" to-port="0" /> <edge from-layer="3031" from-port="0" to-layer="3032" to-port="1" /> <edge from-layer="3032" from-port="2" to-layer="3034" to-port="0" /> <edge from-layer="3033" from-port="0" to-layer="3034" to-port="1" /> <edge from-layer="3034" from-port="2" to-layer="3087" to-port="0" /> <edge from-layer="3035" from-port="0" to-layer="3040" to-port="0" /> <edge from-layer="3036" from-port="0" to-layer="3039" to-port="1" /> <edge from-layer="3037" from-port="0" to-layer="3039" to-port="2" /> <edge from-layer="3038" from-port="0" to-layer="3039" to-port="3" /> <edge from-layer="3039" from-port="4" to-layer="3040" to-port="1" /> <edge from-layer="3040" from-port="2" to-layer="3041" to-port="0" /> <edge from-layer="3041" from-port="1" to-layer="3043" to-port="0" /> <edge from-layer="3042" from-port="0" to-layer="3043" to-port="2" /> <edge from-layer="3043" from-port="3" to-layer="3059" to-port="0" /> <edge from-layer="3044" from-port="0" to-layer="3045" to-port="0" /> <edge from-layer="3045" from-port="1" to-layer="3048" to-port="0" /> <edge from-layer="3046" from-port="0" to-layer="3047" to-port="0" /> <edge from-layer="3047" from-port="1" to-layer="3048" to-port="1" /> <edge from-layer="3048" from-port="2" to-layer="3050" to-port="0" /> <edge from-layer="3049" from-port="0" to-layer="3050" to-port="1" /> <edge from-layer="3050" from-port="2" to-layer="3052" to-port="0" /> <edge from-layer="3051" from-port="0" to-layer="3052" to-port="1" /> <edge from-layer="3052" from-port="2" to-layer="3053" to-port="0" /> <edge from-layer="3053" from-port="1" to-layer="3054" to-port="1" /> <edge from-layer="3054" from-port="2" to-layer="3056" to-port="0" /> <edge from-layer="3055" from-port="0" to-layer="3056" to-port="1" /> <edge from-layer="3056" from-port="2" to-layer="3058" to-port="0" /> <edge from-layer="3057" from-port="0" to-layer="3058" to-port="1" /> <edge from-layer="3058" from-port="2" to-layer="3059" to-port="1" /> <edge from-layer="3059" from-port="2" to-layer="4956" to-port="0" /> <edge from-layer="3059" from-port="2" to-layer="3087" to-port="1" /> <edge from-layer="3060" from-port="0" to-layer="3065" to-port="0" /> <edge from-layer="3061" from-port="0" to-layer="3064" to-port="1" /> <edge from-layer="3062" from-port="0" to-layer="3064" to-port="2" /> <edge from-layer="3063" from-port="0" to-layer="3064" to-port="3" /> <edge from-layer="3064" from-port="4" to-layer="3065" to-port="1" /> <edge from-layer="3065" from-port="2" to-layer="3066" to-port="0" /> <edge from-layer="3066" from-port="1" to-layer="3068" to-port="0" /> <edge from-layer="3067" from-port="0" to-layer="3068" to-port="2" /> <edge from-layer="3068" from-port="3" to-layer="3086" to-port="0" /> <edge from-layer="3069" from-port="0" to-layer="3070" to-port="0" /> <edge from-layer="3070" from-port="1" to-layer="3073" to-port="0" /> <edge from-layer="3071" from-port="0" to-layer="3072" to-port="0" /> <edge from-layer="3072" from-port="1" to-layer="3073" to-port="1" /> <edge from-layer="3073" from-port="2" to-layer="3075" to-port="0" /> <edge from-layer="3074" from-port="0" to-layer="3075" to-port="1" /> <edge from-layer="3075" from-port="2" to-layer="3077" to-port="0" /> <edge from-layer="3076" from-port="0" to-layer="3077" to-port="1" /> <edge from-layer="3077" from-port="2" to-layer="3078" to-port="0" /> <edge from-layer="3078" from-port="1" to-layer="3079" to-port="1" /> <edge from-layer="3079" from-port="2" to-layer="3081" to-port="0" /> <edge from-layer="3080" from-port="0" to-layer="3081" to-port="1" /> <edge from-layer="3081" from-port="2" to-layer="3083" to-port="0" /> <edge from-layer="3082" from-port="0" to-layer="3083" to-port="1" /> <edge from-layer="3083" from-port="2" to-layer="3085" to-port="0" /> <edge from-layer="3084" from-port="0" to-layer="3085" to-port="1" /> <edge from-layer="3085" from-port="2" to-layer="3086" to-port="1" /> <edge from-layer="3086" from-port="2" to-layer="4955" to-port="0" /> <edge from-layer="3086" from-port="2" to-layer="3087" to-port="2" /> <edge from-layer="3087" from-port="4" to-layer="3089" to-port="0" /> <edge from-layer="3088" from-port="0" to-layer="3089" to-port="1" /> <edge from-layer="3089" from-port="2" to-layer="3091" to-port="0" /> <edge from-layer="3090" from-port="0" to-layer="3091" to-port="1" /> <edge from-layer="3091" from-port="2" to-layer="3102" to-port="0" /> <edge from-layer="3092" from-port="0" to-layer="3093" to-port="0" /> <edge from-layer="3093" from-port="1" to-layer="3096" to-port="0" /> <edge from-layer="3094" from-port="0" to-layer="3095" to-port="0" /> <edge from-layer="3095" from-port="1" to-layer="3096" to-port="1" /> <edge from-layer="3096" from-port="2" to-layer="3098" to-port="0" /> <edge from-layer="3097" from-port="0" to-layer="3098" to-port="1" /> <edge from-layer="3098" from-port="2" to-layer="3100" to-port="0" /> <edge from-layer="3099" from-port="0" to-layer="3100" to-port="1" /> <edge from-layer="3100" from-port="2" to-layer="3101" to-port="0" /> <edge from-layer="3101" from-port="1" to-layer="3102" to-port="1" /> <edge from-layer="3102" from-port="2" to-layer="3104" to-port="0" /> <edge from-layer="3103" from-port="0" to-layer="3104" to-port="1" /> <edge from-layer="3104" from-port="2" to-layer="3105" to-port="1" /> <edge from-layer="3105" from-port="2" to-layer="3107" to-port="0" /> <edge from-layer="3105" from-port="2" to-layer="3147" to-port="0" /> <edge from-layer="3106" from-port="0" to-layer="3107" to-port="1" /> <edge from-layer="3107" from-port="2" to-layer="3109" to-port="0" /> <edge from-layer="3108" from-port="0" to-layer="3109" to-port="1" /> <edge from-layer="3109" from-port="2" to-layer="3111" to-port="0" /> <edge from-layer="3110" from-port="0" to-layer="3111" to-port="1" /> <edge from-layer="3111" from-port="2" to-layer="3122" to-port="0" /> <edge from-layer="3112" from-port="0" to-layer="3113" to-port="0" /> <edge from-layer="3113" from-port="1" to-layer="3116" to-port="0" /> <edge from-layer="3114" from-port="0" to-layer="3115" to-port="0" /> <edge from-layer="3115" from-port="1" to-layer="3116" to-port="1" /> <edge from-layer="3116" from-port="2" to-layer="3118" to-port="0" /> <edge from-layer="3117" from-port="0" to-layer="3118" to-port="1" /> <edge from-layer="3118" from-port="2" to-layer="3120" to-port="0" /> <edge from-layer="3119" from-port="0" to-layer="3120" to-port="1" /> <edge from-layer="3120" from-port="2" to-layer="3121" to-port="0" /> <edge from-layer="3121" from-port="1" to-layer="3122" to-port="1" /> <edge from-layer="3122" from-port="2" to-layer="3124" to-port="0" /> <edge from-layer="3123" from-port="0" to-layer="3124" to-port="1" /> <edge from-layer="3124" from-port="2" to-layer="3126" to-port="0" /> <edge from-layer="3125" from-port="0" to-layer="3126" to-port="1" /> <edge from-layer="3126" from-port="2" to-layer="3128" to-port="0" /> <edge from-layer="3127" from-port="0" to-layer="3128" to-port="1" /> <edge from-layer="3128" from-port="2" to-layer="3129" to-port="0" /> <edge from-layer="3129" from-port="3" to-layer="3131" to-port="0" /> <edge from-layer="3130" from-port="0" to-layer="3131" to-port="1" /> <edge from-layer="3131" from-port="2" to-layer="3133" to-port="0" /> <edge from-layer="3132" from-port="0" to-layer="3133" to-port="1" /> <edge from-layer="3133" from-port="2" to-layer="3144" to-port="0" /> <edge from-layer="3134" from-port="0" to-layer="3135" to-port="0" /> <edge from-layer="3135" from-port="1" to-layer="3138" to-port="0" /> <edge from-layer="3136" from-port="0" to-layer="3137" to-port="0" /> <edge from-layer="3137" from-port="1" to-layer="3138" to-port="1" /> <edge from-layer="3138" from-port="2" to-layer="3140" to-port="0" /> <edge from-layer="3139" from-port="0" to-layer="3140" to-port="1" /> <edge from-layer="3140" from-port="2" to-layer="3142" to-port="0" /> <edge from-layer="3141" from-port="0" to-layer="3142" to-port="1" /> <edge from-layer="3142" from-port="2" to-layer="3143" to-port="0" /> <edge from-layer="3143" from-port="1" to-layer="3144" to-port="1" /> <edge from-layer="3144" from-port="2" to-layer="3146" to-port="0" /> <edge from-layer="3145" from-port="0" to-layer="3146" to-port="1" /> <edge from-layer="3146" from-port="2" to-layer="3147" to-port="1" /> <edge from-layer="3147" from-port="2" to-layer="3181" to-port="0" /> <edge from-layer="3147" from-port="2" to-layer="3149" to-port="0" /> <edge from-layer="3148" from-port="0" to-layer="3149" to-port="1" /> <edge from-layer="3149" from-port="2" to-layer="3151" to-port="0" /> <edge from-layer="3150" from-port="0" to-layer="3151" to-port="1" /> <edge from-layer="3151" from-port="2" to-layer="3153" to-port="0" /> <edge from-layer="3152" from-port="0" to-layer="3153" to-port="1" /> <edge from-layer="3153" from-port="2" to-layer="3164" to-port="0" /> <edge from-layer="3154" from-port="0" to-layer="3155" to-port="0" /> <edge from-layer="3155" from-port="1" to-layer="3158" to-port="0" /> <edge from-layer="3156" from-port="0" to-layer="3157" to-port="0" /> <edge from-layer="3157" from-port="1" to-layer="3158" to-port="1" /> <edge from-layer="3158" from-port="2" to-layer="3160" to-port="0" /> <edge from-layer="3159" from-port="0" to-layer="3160" to-port="1" /> <edge from-layer="3160" from-port="2" to-layer="3162" to-port="0" /> <edge from-layer="3161" from-port="0" to-layer="3162" to-port="1" /> <edge from-layer="3162" from-port="2" to-layer="3163" to-port="0" /> <edge from-layer="3163" from-port="1" to-layer="3164" to-port="1" /> <edge from-layer="3164" from-port="2" to-layer="3166" to-port="0" /> <edge from-layer="3165" from-port="0" to-layer="3166" to-port="1" /> <edge from-layer="3166" from-port="2" to-layer="3167" to-port="0" /> <edge from-layer="3167" from-port="1" to-layer="3178" to-port="0" /> <edge from-layer="3168" from-port="0" to-layer="3169" to-port="0" /> <edge from-layer="3169" from-port="1" to-layer="3172" to-port="0" /> <edge from-layer="3170" from-port="0" to-layer="3171" to-port="0" /> <edge from-layer="3171" from-port="1" to-layer="3172" to-port="1" /> <edge from-layer="3172" from-port="2" to-layer="3174" to-port="0" /> <edge from-layer="3173" from-port="0" to-layer="3174" to-port="1" /> <edge from-layer="3174" from-port="2" to-layer="3176" to-port="0" /> <edge from-layer="3175" from-port="0" to-layer="3176" to-port="1" /> <edge from-layer="3176" from-port="2" to-layer="3177" to-port="0" /> <edge from-layer="3177" from-port="1" to-layer="3178" to-port="1" /> <edge from-layer="3178" from-port="2" to-layer="3180" to-port="0" /> <edge from-layer="3179" from-port="0" to-layer="3180" to-port="1" /> <edge from-layer="3180" from-port="2" to-layer="3181" to-port="1" /> <edge from-layer="3181" from-port="2" to-layer="3275" to-port="0" /> <edge from-layer="3181" from-port="2" to-layer="3183" to-port="0" /> <edge from-layer="3182" from-port="0" to-layer="3183" to-port="1" /> <edge from-layer="3183" from-port="2" to-layer="3185" to-port="0" /> <edge from-layer="3184" from-port="0" to-layer="3185" to-port="1" /> <edge from-layer="3185" from-port="2" to-layer="3187" to-port="0" /> <edge from-layer="3186" from-port="0" to-layer="3187" to-port="1" /> <edge from-layer="3187" from-port="2" to-layer="3224" to-port="0" /> <edge from-layer="3187" from-port="2" to-layer="3249" to-port="0" /> <edge from-layer="3187" from-port="2" to-layer="3198" to-port="0" /> <edge from-layer="3188" from-port="0" to-layer="3189" to-port="0" /> <edge from-layer="3189" from-port="1" to-layer="3192" to-port="0" /> <edge from-layer="3190" from-port="0" to-layer="3191" to-port="0" /> <edge from-layer="3191" from-port="1" to-layer="3192" to-port="1" /> <edge from-layer="3192" from-port="2" to-layer="3194" to-port="0" /> <edge from-layer="3193" from-port="0" to-layer="3194" to-port="1" /> <edge from-layer="3194" from-port="2" to-layer="3196" to-port="0" /> <edge from-layer="3195" from-port="0" to-layer="3196" to-port="1" /> <edge from-layer="3196" from-port="2" to-layer="3197" to-port="0" /> <edge from-layer="3197" from-port="1" to-layer="3198" to-port="1" /> <edge from-layer="3198" from-port="2" to-layer="3200" to-port="0" /> <edge from-layer="3199" from-port="0" to-layer="3200" to-port="1" /> <edge from-layer="3200" from-port="2" to-layer="3202" to-port="0" /> <edge from-layer="3201" from-port="0" to-layer="3202" to-port="1" /> <edge from-layer="3202" from-port="2" to-layer="3204" to-port="0" /> <edge from-layer="3203" from-port="0" to-layer="3204" to-port="1" /> <edge from-layer="3204" from-port="2" to-layer="3257" to-port="0" /> <edge from-layer="3205" from-port="0" to-layer="3210" to-port="0" /> <edge from-layer="3206" from-port="0" to-layer="3209" to-port="1" /> <edge from-layer="3207" from-port="0" to-layer="3209" to-port="2" /> <edge from-layer="3208" from-port="0" to-layer="3209" to-port="3" /> <edge from-layer="3209" from-port="4" to-layer="3210" to-port="1" /> <edge from-layer="3210" from-port="2" to-layer="3211" to-port="0" /> <edge from-layer="3211" from-port="1" to-layer="3213" to-port="0" /> <edge from-layer="3212" from-port="0" to-layer="3213" to-port="2" /> <edge from-layer="3213" from-port="3" to-layer="3229" to-port="0" /> <edge from-layer="3214" from-port="0" to-layer="3215" to-port="0" /> <edge from-layer="3215" from-port="1" to-layer="3218" to-port="0" /> <edge from-layer="3216" from-port="0" to-layer="3217" to-port="0" /> <edge from-layer="3217" from-port="1" to-layer="3218" to-port="1" /> <edge from-layer="3218" from-port="2" to-layer="3220" to-port="0" /> <edge from-layer="3219" from-port="0" to-layer="3220" to-port="1" /> <edge from-layer="3220" from-port="2" to-layer="3222" to-port="0" /> <edge from-layer="3221" from-port="0" to-layer="3222" to-port="1" /> <edge from-layer="3222" from-port="2" to-layer="3223" to-port="0" /> <edge from-layer="3223" from-port="1" to-layer="3224" to-port="1" /> <edge from-layer="3224" from-port="2" to-layer="3226" to-port="0" /> <edge from-layer="3225" from-port="0" to-layer="3226" to-port="1" /> <edge from-layer="3226" from-port="2" to-layer="3228" to-port="0" /> <edge from-layer="3227" from-port="0" to-layer="3228" to-port="1" /> <edge from-layer="3228" from-port="2" to-layer="3229" to-port="1" /> <edge from-layer="3229" from-port="2" to-layer="3257" to-port="1" /> <edge from-layer="3229" from-port="2" to-layer="4954" to-port="0" /> <edge from-layer="3230" from-port="0" to-layer="3235" to-port="0" /> <edge from-layer="3231" from-port="0" to-layer="3234" to-port="1" /> <edge from-layer="3232" from-port="0" to-layer="3234" to-port="2" /> <edge from-layer="3233" from-port="0" to-layer="3234" to-port="3" /> <edge from-layer="3234" from-port="4" to-layer="3235" to-port="1" /> <edge from-layer="3235" from-port="2" to-layer="3236" to-port="0" /> <edge from-layer="3236" from-port="1" to-layer="3238" to-port="0" /> <edge from-layer="3237" from-port="0" to-layer="3238" to-port="2" /> <edge from-layer="3238" from-port="3" to-layer="3256" to-port="0" /> <edge from-layer="3239" from-port="0" to-layer="3240" to-port="0" /> <edge from-layer="3240" from-port="1" to-layer="3243" to-port="0" /> <edge from-layer="3241" from-port="0" to-layer="3242" to-port="0" /> <edge from-layer="3242" from-port="1" to-layer="3243" to-port="1" /> <edge from-layer="3243" from-port="2" to-layer="3245" to-port="0" /> <edge from-layer="3244" from-port="0" to-layer="3245" to-port="1" /> <edge from-layer="3245" from-port="2" to-layer="3247" to-port="0" /> <edge from-layer="3246" from-port="0" to-layer="3247" to-port="1" /> <edge from-layer="3247" from-port="2" to-layer="3248" to-port="0" /> <edge from-layer="3248" from-port="1" to-layer="3249" to-port="1" /> <edge from-layer="3249" from-port="2" to-layer="3251" to-port="0" /> <edge from-layer="3250" from-port="0" to-layer="3251" to-port="1" /> <edge from-layer="3251" from-port="2" to-layer="3253" to-port="0" /> <edge from-layer="3252" from-port="0" to-layer="3253" to-port="1" /> <edge from-layer="3253" from-port="2" to-layer="3255" to-port="0" /> <edge from-layer="3254" from-port="0" to-layer="3255" to-port="1" /> <edge from-layer="3255" from-port="2" to-layer="3256" to-port="1" /> <edge from-layer="3256" from-port="2" to-layer="3257" to-port="2" /> <edge from-layer="3256" from-port="2" to-layer="4953" to-port="0" /> <edge from-layer="3257" from-port="4" to-layer="3259" to-port="0" /> <edge from-layer="3258" from-port="0" to-layer="3259" to-port="1" /> <edge from-layer="3259" from-port="2" to-layer="3261" to-port="0" /> <edge from-layer="3260" from-port="0" to-layer="3261" to-port="1" /> <edge from-layer="3261" from-port="2" to-layer="3272" to-port="0" /> <edge from-layer="3262" from-port="0" to-layer="3263" to-port="0" /> <edge from-layer="3263" from-port="1" to-layer="3266" to-port="0" /> <edge from-layer="3264" from-port="0" to-layer="3265" to-port="0" /> <edge from-layer="3265" from-port="1" to-layer="3266" to-port="1" /> <edge from-layer="3266" from-port="2" to-layer="3268" to-port="0" /> <edge from-layer="3267" from-port="0" to-layer="3268" to-port="1" /> <edge from-layer="3268" from-port="2" to-layer="3270" to-port="0" /> <edge from-layer="3269" from-port="0" to-layer="3270" to-port="1" /> <edge from-layer="3270" from-port="2" to-layer="3271" to-port="0" /> <edge from-layer="3271" from-port="1" to-layer="3272" to-port="1" /> <edge from-layer="3272" from-port="2" to-layer="3274" to-port="0" /> <edge from-layer="3273" from-port="0" to-layer="3274" to-port="1" /> <edge from-layer="3274" from-port="2" to-layer="3275" to-port="1" /> <edge from-layer="3275" from-port="2" to-layer="3277" to-port="0" /> <edge from-layer="3275" from-port="2" to-layer="3317" to-port="0" /> <edge from-layer="3276" from-port="0" to-layer="3277" to-port="1" /> <edge from-layer="3277" from-port="2" to-layer="3279" to-port="0" /> <edge from-layer="3278" from-port="0" to-layer="3279" to-port="1" /> <edge from-layer="3279" from-port="2" to-layer="3281" to-port="0" /> <edge from-layer="3280" from-port="0" to-layer="3281" to-port="1" /> <edge from-layer="3281" from-port="2" to-layer="3292" to-port="0" /> <edge from-layer="3282" from-port="0" to-layer="3283" to-port="0" /> <edge from-layer="3283" from-port="1" to-layer="3286" to-port="0" /> <edge from-layer="3284" from-port="0" to-layer="3285" to-port="0" /> <edge from-layer="3285" from-port="1" to-layer="3286" to-port="1" /> <edge from-layer="3286" from-port="2" to-layer="3288" to-port="0" /> <edge from-layer="3287" from-port="0" to-layer="3288" to-port="1" /> <edge from-layer="3288" from-port="2" to-layer="3290" to-port="0" /> <edge from-layer="3289" from-port="0" to-layer="3290" to-port="1" /> <edge from-layer="3290" from-port="2" to-layer="3291" to-port="0" /> <edge from-layer="3291" from-port="1" to-layer="3292" to-port="1" /> <edge from-layer="3292" from-port="2" to-layer="3294" to-port="0" /> <edge from-layer="3293" from-port="0" to-layer="3294" to-port="1" /> <edge from-layer="3294" from-port="2" to-layer="3296" to-port="0" /> <edge from-layer="3295" from-port="0" to-layer="3296" to-port="1" /> <edge from-layer="3296" from-port="2" to-layer="3298" to-port="0" /> <edge from-layer="3297" from-port="0" to-layer="3298" to-port="1" /> <edge from-layer="3298" from-port="2" to-layer="3299" to-port="0" /> <edge from-layer="3299" from-port="3" to-layer="3301" to-port="0" /> <edge from-layer="3300" from-port="0" to-layer="3301" to-port="1" /> <edge from-layer="3301" from-port="2" to-layer="3303" to-port="0" /> <edge from-layer="3302" from-port="0" to-layer="3303" to-port="1" /> <edge from-layer="3303" from-port="2" to-layer="3314" to-port="0" /> <edge from-layer="3304" from-port="0" to-layer="3305" to-port="0" /> <edge from-layer="3305" from-port="1" to-layer="3308" to-port="0" /> <edge from-layer="3306" from-port="0" to-layer="3307" to-port="0" /> <edge from-layer="3307" from-port="1" to-layer="3308" to-port="1" /> <edge from-layer="3308" from-port="2" to-layer="3310" to-port="0" /> <edge from-layer="3309" from-port="0" to-layer="3310" to-port="1" /> <edge from-layer="3310" from-port="2" to-layer="3312" to-port="0" /> <edge from-layer="3311" from-port="0" to-layer="3312" to-port="1" /> <edge from-layer="3312" from-port="2" to-layer="3313" to-port="0" /> <edge from-layer="3313" from-port="1" to-layer="3314" to-port="1" /> <edge from-layer="3314" from-port="2" to-layer="3316" to-port="0" /> <edge from-layer="3315" from-port="0" to-layer="3316" to-port="1" /> <edge from-layer="3316" from-port="2" to-layer="3317" to-port="1" /> <edge from-layer="3317" from-port="2" to-layer="3319" to-port="0" /> <edge from-layer="3317" from-port="2" to-layer="3351" to-port="0" /> <edge from-layer="3318" from-port="0" to-layer="3319" to-port="1" /> <edge from-layer="3319" from-port="2" to-layer="3321" to-port="0" /> <edge from-layer="3320" from-port="0" to-layer="3321" to-port="1" /> <edge from-layer="3321" from-port="2" to-layer="3323" to-port="0" /> <edge from-layer="3322" from-port="0" to-layer="3323" to-port="1" /> <edge from-layer="3323" from-port="2" to-layer="3334" to-port="0" /> <edge from-layer="3324" from-port="0" to-layer="3325" to-port="0" /> <edge from-layer="3325" from-port="1" to-layer="3328" to-port="0" /> <edge from-layer="3326" from-port="0" to-layer="3327" to-port="0" /> <edge from-layer="3327" from-port="1" to-layer="3328" to-port="1" /> <edge from-layer="3328" from-port="2" to-layer="3330" to-port="0" /> <edge from-layer="3329" from-port="0" to-layer="3330" to-port="1" /> <edge from-layer="3330" from-port="2" to-layer="3332" to-port="0" /> <edge from-layer="3331" from-port="0" to-layer="3332" to-port="1" /> <edge from-layer="3332" from-port="2" to-layer="3333" to-port="0" /> <edge from-layer="3333" from-port="1" to-layer="3334" to-port="1" /> <edge from-layer="3334" from-port="2" to-layer="3336" to-port="0" /> <edge from-layer="3335" from-port="0" to-layer="3336" to-port="1" /> <edge from-layer="3336" from-port="2" to-layer="3337" to-port="0" /> <edge from-layer="3337" from-port="1" to-layer="3348" to-port="0" /> <edge from-layer="3338" from-port="0" to-layer="3339" to-port="0" /> <edge from-layer="3339" from-port="1" to-layer="3342" to-port="0" /> <edge from-layer="3340" from-port="0" to-layer="3341" to-port="0" /> <edge from-layer="3341" from-port="1" to-layer="3342" to-port="1" /> <edge from-layer="3342" from-port="2" to-layer="3344" to-port="0" /> <edge from-layer="3343" from-port="0" to-layer="3344" to-port="1" /> <edge from-layer="3344" from-port="2" to-layer="3346" to-port="0" /> <edge from-layer="3345" from-port="0" to-layer="3346" to-port="1" /> <edge from-layer="3346" from-port="2" to-layer="3347" to-port="0" /> <edge from-layer="3347" from-port="1" to-layer="3348" to-port="1" /> <edge from-layer="3348" from-port="2" to-layer="3350" to-port="0" /> <edge from-layer="3349" from-port="0" to-layer="3350" to-port="1" /> <edge from-layer="3350" from-port="2" to-layer="3351" to-port="1" /> <edge from-layer="3351" from-port="2" to-layer="3353" to-port="0" /> <edge from-layer="3351" from-port="2" to-layer="3445" to-port="0" /> <edge from-layer="3352" from-port="0" to-layer="3353" to-port="1" /> <edge from-layer="3353" from-port="2" to-layer="3355" to-port="0" /> <edge from-layer="3354" from-port="0" to-layer="3355" to-port="1" /> <edge from-layer="3355" from-port="2" to-layer="3357" to-port="0" /> <edge from-layer="3356" from-port="0" to-layer="3357" to-port="1" /> <edge from-layer="3357" from-port="2" to-layer="3419" to-port="0" /> <edge from-layer="3357" from-port="2" to-layer="3368" to-port="0" /> <edge from-layer="3357" from-port="2" to-layer="3394" to-port="0" /> <edge from-layer="3358" from-port="0" to-layer="3359" to-port="0" /> <edge from-layer="3359" from-port="1" to-layer="3362" to-port="0" /> <edge from-layer="3360" from-port="0" to-layer="3361" to-port="0" /> <edge from-layer="3361" from-port="1" to-layer="3362" to-port="1" /> <edge from-layer="3362" from-port="2" to-layer="3364" to-port="0" /> <edge from-layer="3363" from-port="0" to-layer="3364" to-port="1" /> <edge from-layer="3364" from-port="2" to-layer="3366" to-port="0" /> <edge from-layer="3365" from-port="0" to-layer="3366" to-port="1" /> <edge from-layer="3366" from-port="2" to-layer="3367" to-port="0" /> <edge from-layer="3367" from-port="1" to-layer="3368" to-port="1" /> <edge from-layer="3368" from-port="2" to-layer="3370" to-port="0" /> <edge from-layer="3369" from-port="0" to-layer="3370" to-port="1" /> <edge from-layer="3370" from-port="2" to-layer="3372" to-port="0" /> <edge from-layer="3371" from-port="0" to-layer="3372" to-port="1" /> <edge from-layer="3372" from-port="2" to-layer="3374" to-port="0" /> <edge from-layer="3373" from-port="0" to-layer="3374" to-port="1" /> <edge from-layer="3374" from-port="2" to-layer="3427" to-port="0" /> <edge from-layer="3375" from-port="0" to-layer="3380" to-port="0" /> <edge from-layer="3376" from-port="0" to-layer="3379" to-port="1" /> <edge from-layer="3377" from-port="0" to-layer="3379" to-port="2" /> <edge from-layer="3378" from-port="0" to-layer="3379" to-port="3" /> <edge from-layer="3379" from-port="4" to-layer="3380" to-port="1" /> <edge from-layer="3380" from-port="2" to-layer="3381" to-port="0" /> <edge from-layer="3381" from-port="1" to-layer="3383" to-port="0" /> <edge from-layer="3382" from-port="0" to-layer="3383" to-port="2" /> <edge from-layer="3383" from-port="3" to-layer="3399" to-port="0" /> <edge from-layer="3384" from-port="0" to-layer="3385" to-port="0" /> <edge from-layer="3385" from-port="1" to-layer="3388" to-port="0" /> <edge from-layer="3386" from-port="0" to-layer="3387" to-port="0" /> <edge from-layer="3387" from-port="1" to-layer="3388" to-port="1" /> <edge from-layer="3388" from-port="2" to-layer="3390" to-port="0" /> <edge from-layer="3389" from-port="0" to-layer="3390" to-port="1" /> <edge from-layer="3390" from-port="2" to-layer="3392" to-port="0" /> <edge from-layer="3391" from-port="0" to-layer="3392" to-port="1" /> <edge from-layer="3392" from-port="2" to-layer="3393" to-port="0" /> <edge from-layer="3393" from-port="1" to-layer="3394" to-port="1" /> <edge from-layer="3394" from-port="2" to-layer="3396" to-port="0" /> <edge from-layer="3395" from-port="0" to-layer="3396" to-port="1" /> <edge from-layer="3396" from-port="2" to-layer="3398" to-port="0" /> <edge from-layer="3397" from-port="0" to-layer="3398" to-port="1" /> <edge from-layer="3398" from-port="2" to-layer="3399" to-port="1" /> <edge from-layer="3399" from-port="2" to-layer="4952" to-port="0" /> <edge from-layer="3399" from-port="2" to-layer="3427" to-port="1" /> <edge from-layer="3400" from-port="0" to-layer="3405" to-port="0" /> <edge from-layer="3401" from-port="0" to-layer="3404" to-port="1" /> <edge from-layer="3402" from-port="0" to-layer="3404" to-port="2" /> <edge from-layer="3403" from-port="0" to-layer="3404" to-port="3" /> <edge from-layer="3404" from-port="4" to-layer="3405" to-port="1" /> <edge from-layer="3405" from-port="2" to-layer="3406" to-port="0" /> <edge from-layer="3406" from-port="1" to-layer="3408" to-port="0" /> <edge from-layer="3407" from-port="0" to-layer="3408" to-port="2" /> <edge from-layer="3408" from-port="3" to-layer="3426" to-port="0" /> <edge from-layer="3409" from-port="0" to-layer="3410" to-port="0" /> <edge from-layer="3410" from-port="1" to-layer="3413" to-port="0" /> <edge from-layer="3411" from-port="0" to-layer="3412" to-port="0" /> <edge from-layer="3412" from-port="1" to-layer="3413" to-port="1" /> <edge from-layer="3413" from-port="2" to-layer="3415" to-port="0" /> <edge from-layer="3414" from-port="0" to-layer="3415" to-port="1" /> <edge from-layer="3415" from-port="2" to-layer="3417" to-port="0" /> <edge from-layer="3416" from-port="0" to-layer="3417" to-port="1" /> <edge from-layer="3417" from-port="2" to-layer="3418" to-port="0" /> <edge from-layer="3418" from-port="1" to-layer="3419" to-port="1" /> <edge from-layer="3419" from-port="2" to-layer="3421" to-port="0" /> <edge from-layer="3420" from-port="0" to-layer="3421" to-port="1" /> <edge from-layer="3421" from-port="2" to-layer="3423" to-port="0" /> <edge from-layer="3422" from-port="0" to-layer="3423" to-port="1" /> <edge from-layer="3423" from-port="2" to-layer="3425" to-port="0" /> <edge from-layer="3424" from-port="0" to-layer="3425" to-port="1" /> <edge from-layer="3425" from-port="2" to-layer="3426" to-port="1" /> <edge from-layer="3426" from-port="2" to-layer="4951" to-port="0" /> <edge from-layer="3426" from-port="2" to-layer="3427" to-port="2" /> <edge from-layer="3427" from-port="4" to-layer="3429" to-port="0" /> <edge from-layer="3428" from-port="0" to-layer="3429" to-port="1" /> <edge from-layer="3429" from-port="2" to-layer="3431" to-port="0" /> <edge from-layer="3430" from-port="0" to-layer="3431" to-port="1" /> <edge from-layer="3431" from-port="2" to-layer="3442" to-port="0" /> <edge from-layer="3432" from-port="0" to-layer="3433" to-port="0" /> <edge from-layer="3433" from-port="1" to-layer="3436" to-port="0" /> <edge from-layer="3434" from-port="0" to-layer="3435" to-port="0" /> <edge from-layer="3435" from-port="1" to-layer="3436" to-port="1" /> <edge from-layer="3436" from-port="2" to-layer="3438" to-port="0" /> <edge from-layer="3437" from-port="0" to-layer="3438" to-port="1" /> <edge from-layer="3438" from-port="2" to-layer="3440" to-port="0" /> <edge from-layer="3439" from-port="0" to-layer="3440" to-port="1" /> <edge from-layer="3440" from-port="2" to-layer="3441" to-port="0" /> <edge from-layer="3441" from-port="1" to-layer="3442" to-port="1" /> <edge from-layer="3442" from-port="2" to-layer="3444" to-port="0" /> <edge from-layer="3443" from-port="0" to-layer="3444" to-port="1" /> <edge from-layer="3444" from-port="2" to-layer="3445" to-port="1" /> <edge from-layer="3445" from-port="2" to-layer="3447" to-port="0" /> <edge from-layer="3445" from-port="2" to-layer="3487" to-port="0" /> <edge from-layer="3446" from-port="0" to-layer="3447" to-port="1" /> <edge from-layer="3447" from-port="2" to-layer="3449" to-port="0" /> <edge from-layer="3448" from-port="0" to-layer="3449" to-port="1" /> <edge from-layer="3449" from-port="2" to-layer="3451" to-port="0" /> <edge from-layer="3450" from-port="0" to-layer="3451" to-port="1" /> <edge from-layer="3451" from-port="2" to-layer="3462" to-port="0" /> <edge from-layer="3452" from-port="0" to-layer="3453" to-port="0" /> <edge from-layer="3453" from-port="1" to-layer="3456" to-port="0" /> <edge from-layer="3454" from-port="0" to-layer="3455" to-port="0" /> <edge from-layer="3455" from-port="1" to-layer="3456" to-port="1" /> <edge from-layer="3456" from-port="2" to-layer="3458" to-port="0" /> <edge from-layer="3457" from-port="0" to-layer="3458" to-port="1" /> <edge from-layer="3458" from-port="2" to-layer="3460" to-port="0" /> <edge from-layer="3459" from-port="0" to-layer="3460" to-port="1" /> <edge from-layer="3460" from-port="2" to-layer="3461" to-port="0" /> <edge from-layer="3461" from-port="1" to-layer="3462" to-port="1" /> <edge from-layer="3462" from-port="2" to-layer="3464" to-port="0" /> <edge from-layer="3463" from-port="0" to-layer="3464" to-port="1" /> <edge from-layer="3464" from-port="2" to-layer="3466" to-port="0" /> <edge from-layer="3465" from-port="0" to-layer="3466" to-port="1" /> <edge from-layer="3466" from-port="2" to-layer="3468" to-port="0" /> <edge from-layer="3467" from-port="0" to-layer="3468" to-port="1" /> <edge from-layer="3468" from-port="2" to-layer="3469" to-port="0" /> <edge from-layer="3469" from-port="3" to-layer="3471" to-port="0" /> <edge from-layer="3470" from-port="0" to-layer="3471" to-port="1" /> <edge from-layer="3471" from-port="2" to-layer="3473" to-port="0" /> <edge from-layer="3472" from-port="0" to-layer="3473" to-port="1" /> <edge from-layer="3473" from-port="2" to-layer="3484" to-port="0" /> <edge from-layer="3474" from-port="0" to-layer="3475" to-port="0" /> <edge from-layer="3475" from-port="1" to-layer="3478" to-port="0" /> <edge from-layer="3476" from-port="0" to-layer="3477" to-port="0" /> <edge from-layer="3477" from-port="1" to-layer="3478" to-port="1" /> <edge from-layer="3478" from-port="2" to-layer="3480" to-port="0" /> <edge from-layer="3479" from-port="0" to-layer="3480" to-port="1" /> <edge from-layer="3480" from-port="2" to-layer="3482" to-port="0" /> <edge from-layer="3481" from-port="0" to-layer="3482" to-port="1" /> <edge from-layer="3482" from-port="2" to-layer="3483" to-port="0" /> <edge from-layer="3483" from-port="1" to-layer="3484" to-port="1" /> <edge from-layer="3484" from-port="2" to-layer="3486" to-port="0" /> <edge from-layer="3485" from-port="0" to-layer="3486" to-port="1" /> <edge from-layer="3486" from-port="2" to-layer="3487" to-port="1" /> <edge from-layer="3487" from-port="2" to-layer="3521" to-port="0" /> <edge from-layer="3487" from-port="2" to-layer="3489" to-port="0" /> <edge from-layer="3488" from-port="0" to-layer="3489" to-port="1" /> <edge from-layer="3489" from-port="2" to-layer="3491" to-port="0" /> <edge from-layer="3490" from-port="0" to-layer="3491" to-port="1" /> <edge from-layer="3491" from-port="2" to-layer="3493" to-port="0" /> <edge from-layer="3492" from-port="0" to-layer="3493" to-port="1" /> <edge from-layer="3493" from-port="2" to-layer="3504" to-port="0" /> <edge from-layer="3494" from-port="0" to-layer="3495" to-port="0" /> <edge from-layer="3495" from-port="1" to-layer="3498" to-port="0" /> <edge from-layer="3496" from-port="0" to-layer="3497" to-port="0" /> <edge from-layer="3497" from-port="1" to-layer="3498" to-port="1" /> <edge from-layer="3498" from-port="2" to-layer="3500" to-port="0" /> <edge from-layer="3499" from-port="0" to-layer="3500" to-port="1" /> <edge from-layer="3500" from-port="2" to-layer="3502" to-port="0" /> <edge from-layer="3501" from-port="0" to-layer="3502" to-port="1" /> <edge from-layer="3502" from-port="2" to-layer="3503" to-port="0" /> <edge from-layer="3503" from-port="1" to-layer="3504" to-port="1" /> <edge from-layer="3504" from-port="2" to-layer="3506" to-port="0" /> <edge from-layer="3505" from-port="0" to-layer="3506" to-port="1" /> <edge from-layer="3506" from-port="2" to-layer="3507" to-port="0" /> <edge from-layer="3507" from-port="1" to-layer="3518" to-port="0" /> <edge from-layer="3508" from-port="0" to-layer="3509" to-port="0" /> <edge from-layer="3509" from-port="1" to-layer="3512" to-port="0" /> <edge from-layer="3510" from-port="0" to-layer="3511" to-port="0" /> <edge from-layer="3511" from-port="1" to-layer="3512" to-port="1" /> <edge from-layer="3512" from-port="2" to-layer="3514" to-port="0" /> <edge from-layer="3513" from-port="0" to-layer="3514" to-port="1" /> <edge from-layer="3514" from-port="2" to-layer="3516" to-port="0" /> <edge from-layer="3515" from-port="0" to-layer="3516" to-port="1" /> <edge from-layer="3516" from-port="2" to-layer="3517" to-port="0" /> <edge from-layer="3517" from-port="1" to-layer="3518" to-port="1" /> <edge from-layer="3518" from-port="2" to-layer="3520" to-port="0" /> <edge from-layer="3519" from-port="0" to-layer="3520" to-port="1" /> <edge from-layer="3520" from-port="2" to-layer="3521" to-port="1" /> <edge from-layer="3521" from-port="2" to-layer="3615" to-port="0" /> <edge from-layer="3521" from-port="2" to-layer="3523" to-port="0" /> <edge from-layer="3522" from-port="0" to-layer="3523" to-port="1" /> <edge from-layer="3523" from-port="2" to-layer="3525" to-port="0" /> <edge from-layer="3524" from-port="0" to-layer="3525" to-port="1" /> <edge from-layer="3525" from-port="2" to-layer="3527" to-port="0" /> <edge from-layer="3526" from-port="0" to-layer="3527" to-port="1" /> <edge from-layer="3527" from-port="2" to-layer="3589" to-port="0" /> <edge from-layer="3527" from-port="2" to-layer="3538" to-port="0" /> <edge from-layer="3527" from-port="2" to-layer="3564" to-port="0" /> <edge from-layer="3528" from-port="0" to-layer="3529" to-port="0" /> <edge from-layer="3529" from-port="1" to-layer="3532" to-port="0" /> <edge from-layer="3530" from-port="0" to-layer="3531" to-port="0" /> <edge from-layer="3531" from-port="1" to-layer="3532" to-port="1" /> <edge from-layer="3532" from-port="2" to-layer="3534" to-port="0" /> <edge from-layer="3533" from-port="0" to-layer="3534" to-port="1" /> <edge from-layer="3534" from-port="2" to-layer="3536" to-port="0" /> <edge from-layer="3535" from-port="0" to-layer="3536" to-port="1" /> <edge from-layer="3536" from-port="2" to-layer="3537" to-port="0" /> <edge from-layer="3537" from-port="1" to-layer="3538" to-port="1" /> <edge from-layer="3538" from-port="2" to-layer="3540" to-port="0" /> <edge from-layer="3539" from-port="0" to-layer="3540" to-port="1" /> <edge from-layer="3540" from-port="2" to-layer="3542" to-port="0" /> <edge from-layer="3541" from-port="0" to-layer="3542" to-port="1" /> <edge from-layer="3542" from-port="2" to-layer="3544" to-port="0" /> <edge from-layer="3543" from-port="0" to-layer="3544" to-port="1" /> <edge from-layer="3544" from-port="2" to-layer="3597" to-port="0" /> <edge from-layer="3545" from-port="0" to-layer="3550" to-port="0" /> <edge from-layer="3546" from-port="0" to-layer="3549" to-port="1" /> <edge from-layer="3547" from-port="0" to-layer="3549" to-port="2" /> <edge from-layer="3548" from-port="0" to-layer="3549" to-port="3" /> <edge from-layer="3549" from-port="4" to-layer="3550" to-port="1" /> <edge from-layer="3550" from-port="2" to-layer="3551" to-port="0" /> <edge from-layer="3551" from-port="1" to-layer="3553" to-port="0" /> <edge from-layer="3552" from-port="0" to-layer="3553" to-port="2" /> <edge from-layer="3553" from-port="3" to-layer="3569" to-port="0" /> <edge from-layer="3554" from-port="0" to-layer="3555" to-port="0" /> <edge from-layer="3555" from-port="1" to-layer="3558" to-port="0" /> <edge from-layer="3556" from-port="0" to-layer="3557" to-port="0" /> <edge from-layer="3557" from-port="1" to-layer="3558" to-port="1" /> <edge from-layer="3558" from-port="2" to-layer="3560" to-port="0" /> <edge from-layer="3559" from-port="0" to-layer="3560" to-port="1" /> <edge from-layer="3560" from-port="2" to-layer="3562" to-port="0" /> <edge from-layer="3561" from-port="0" to-layer="3562" to-port="1" /> <edge from-layer="3562" from-port="2" to-layer="3563" to-port="0" /> <edge from-layer="3563" from-port="1" to-layer="3564" to-port="1" /> <edge from-layer="3564" from-port="2" to-layer="3566" to-port="0" /> <edge from-layer="3565" from-port="0" to-layer="3566" to-port="1" /> <edge from-layer="3566" from-port="2" to-layer="3568" to-port="0" /> <edge from-layer="3567" from-port="0" to-layer="3568" to-port="1" /> <edge from-layer="3568" from-port="2" to-layer="3569" to-port="1" /> <edge from-layer="3569" from-port="2" to-layer="3597" to-port="1" /> <edge from-layer="3569" from-port="2" to-layer="4950" to-port="0" /> <edge from-layer="3570" from-port="0" to-layer="3575" to-port="0" /> <edge from-layer="3571" from-port="0" to-layer="3574" to-port="1" /> <edge from-layer="3572" from-port="0" to-layer="3574" to-port="2" /> <edge from-layer="3573" from-port="0" to-layer="3574" to-port="3" /> <edge from-layer="3574" from-port="4" to-layer="3575" to-port="1" /> <edge from-layer="3575" from-port="2" to-layer="3576" to-port="0" /> <edge from-layer="3576" from-port="1" to-layer="3578" to-port="0" /> <edge from-layer="3577" from-port="0" to-layer="3578" to-port="2" /> <edge from-layer="3578" from-port="3" to-layer="3596" to-port="0" /> <edge from-layer="3579" from-port="0" to-layer="3580" to-port="0" /> <edge from-layer="3580" from-port="1" to-layer="3583" to-port="0" /> <edge from-layer="3581" from-port="0" to-layer="3582" to-port="0" /> <edge from-layer="3582" from-port="1" to-layer="3583" to-port="1" /> <edge from-layer="3583" from-port="2" to-layer="3585" to-port="0" /> <edge from-layer="3584" from-port="0" to-layer="3585" to-port="1" /> <edge from-layer="3585" from-port="2" to-layer="3587" to-port="0" /> <edge from-layer="3586" from-port="0" to-layer="3587" to-port="1" /> <edge from-layer="3587" from-port="2" to-layer="3588" to-port="0" /> <edge from-layer="3588" from-port="1" to-layer="3589" to-port="1" /> <edge from-layer="3589" from-port="2" to-layer="3591" to-port="0" /> <edge from-layer="3590" from-port="0" to-layer="3591" to-port="1" /> <edge from-layer="3591" from-port="2" to-layer="3593" to-port="0" /> <edge from-layer="3592" from-port="0" to-layer="3593" to-port="1" /> <edge from-layer="3593" from-port="2" to-layer="3595" to-port="0" /> <edge from-layer="3594" from-port="0" to-layer="3595" to-port="1" /> <edge from-layer="3595" from-port="2" to-layer="3596" to-port="1" /> <edge from-layer="3596" from-port="2" to-layer="3597" to-port="2" /> <edge from-layer="3596" from-port="2" to-layer="4949" to-port="0" /> <edge from-layer="3597" from-port="4" to-layer="3599" to-port="0" /> <edge from-layer="3598" from-port="0" to-layer="3599" to-port="1" /> <edge from-layer="3599" from-port="2" to-layer="3601" to-port="0" /> <edge from-layer="3600" from-port="0" to-layer="3601" to-port="1" /> <edge from-layer="3601" from-port="2" to-layer="3612" to-port="0" /> <edge from-layer="3602" from-port="0" to-layer="3603" to-port="0" /> <edge from-layer="3603" from-port="1" to-layer="3606" to-port="0" /> <edge from-layer="3604" from-port="0" to-layer="3605" to-port="0" /> <edge from-layer="3605" from-port="1" to-layer="3606" to-port="1" /> <edge from-layer="3606" from-port="2" to-layer="3608" to-port="0" /> <edge from-layer="3607" from-port="0" to-layer="3608" to-port="1" /> <edge from-layer="3608" from-port="2" to-layer="3610" to-port="0" /> <edge from-layer="3609" from-port="0" to-layer="3610" to-port="1" /> <edge from-layer="3610" from-port="2" to-layer="3611" to-port="0" /> <edge from-layer="3611" from-port="1" to-layer="3612" to-port="1" /> <edge from-layer="3612" from-port="2" to-layer="3614" to-port="0" /> <edge from-layer="3613" from-port="0" to-layer="3614" to-port="1" /> <edge from-layer="3614" from-port="2" to-layer="3615" to-port="1" /> <edge from-layer="3615" from-port="2" to-layer="3617" to-port="0" /> <edge from-layer="3615" from-port="2" to-layer="3657" to-port="0" /> <edge from-layer="3616" from-port="0" to-layer="3617" to-port="1" /> <edge from-layer="3617" from-port="2" to-layer="3619" to-port="0" /> <edge from-layer="3618" from-port="0" to-layer="3619" to-port="1" /> <edge from-layer="3619" from-port="2" to-layer="3621" to-port="0" /> <edge from-layer="3620" from-port="0" to-layer="3621" to-port="1" /> <edge from-layer="3621" from-port="2" to-layer="3632" to-port="0" /> <edge from-layer="3622" from-port="0" to-layer="3623" to-port="0" /> <edge from-layer="3623" from-port="1" to-layer="3626" to-port="0" /> <edge from-layer="3624" from-port="0" to-layer="3625" to-port="0" /> <edge from-layer="3625" from-port="1" to-layer="3626" to-port="1" /> <edge from-layer="3626" from-port="2" to-layer="3628" to-port="0" /> <edge from-layer="3627" from-port="0" to-layer="3628" to-port="1" /> <edge from-layer="3628" from-port="2" to-layer="3630" to-port="0" /> <edge from-layer="3629" from-port="0" to-layer="3630" to-port="1" /> <edge from-layer="3630" from-port="2" to-layer="3631" to-port="0" /> <edge from-layer="3631" from-port="1" to-layer="3632" to-port="1" /> <edge from-layer="3632" from-port="2" to-layer="3634" to-port="0" /> <edge from-layer="3633" from-port="0" to-layer="3634" to-port="1" /> <edge from-layer="3634" from-port="2" to-layer="3636" to-port="0" /> <edge from-layer="3635" from-port="0" to-layer="3636" to-port="1" /> <edge from-layer="3636" from-port="2" to-layer="3638" to-port="0" /> <edge from-layer="3637" from-port="0" to-layer="3638" to-port="1" /> <edge from-layer="3638" from-port="2" to-layer="3639" to-port="0" /> <edge from-layer="3639" from-port="3" to-layer="3641" to-port="0" /> <edge from-layer="3640" from-port="0" to-layer="3641" to-port="1" /> <edge from-layer="3641" from-port="2" to-layer="3643" to-port="0" /> <edge from-layer="3642" from-port="0" to-layer="3643" to-port="1" /> <edge from-layer="3643" from-port="2" to-layer="3654" to-port="0" /> <edge from-layer="3644" from-port="0" to-layer="3645" to-port="0" /> <edge from-layer="3645" from-port="1" to-layer="3648" to-port="0" /> <edge from-layer="3646" from-port="0" to-layer="3647" to-port="0" /> <edge from-layer="3647" from-port="1" to-layer="3648" to-port="1" /> <edge from-layer="3648" from-port="2" to-layer="3650" to-port="0" /> <edge from-layer="3649" from-port="0" to-layer="3650" to-port="1" /> <edge from-layer="3650" from-port="2" to-layer="3652" to-port="0" /> <edge from-layer="3651" from-port="0" to-layer="3652" to-port="1" /> <edge from-layer="3652" from-port="2" to-layer="3653" to-port="0" /> <edge from-layer="3653" from-port="1" to-layer="3654" to-port="1" /> <edge from-layer="3654" from-port="2" to-layer="3656" to-port="0" /> <edge from-layer="3655" from-port="0" to-layer="3656" to-port="1" /> <edge from-layer="3656" from-port="2" to-layer="3657" to-port="1" /> <edge from-layer="3657" from-port="2" to-layer="3659" to-port="0" /> <edge from-layer="3657" from-port="2" to-layer="3691" to-port="0" /> <edge from-layer="3658" from-port="0" to-layer="3659" to-port="1" /> <edge from-layer="3659" from-port="2" to-layer="3661" to-port="0" /> <edge from-layer="3660" from-port="0" to-layer="3661" to-port="1" /> <edge from-layer="3661" from-port="2" to-layer="3663" to-port="0" /> <edge from-layer="3662" from-port="0" to-layer="3663" to-port="1" /> <edge from-layer="3663" from-port="2" to-layer="3674" to-port="0" /> <edge from-layer="3664" from-port="0" to-layer="3665" to-port="0" /> <edge from-layer="3665" from-port="1" to-layer="3668" to-port="0" /> <edge from-layer="3666" from-port="0" to-layer="3667" to-port="0" /> <edge from-layer="3667" from-port="1" to-layer="3668" to-port="1" /> <edge from-layer="3668" from-port="2" to-layer="3670" to-port="0" /> <edge from-layer="3669" from-port="0" to-layer="3670" to-port="1" /> <edge from-layer="3670" from-port="2" to-layer="3672" to-port="0" /> <edge from-layer="3671" from-port="0" to-layer="3672" to-port="1" /> <edge from-layer="3672" from-port="2" to-layer="3673" to-port="0" /> <edge from-layer="3673" from-port="1" to-layer="3674" to-port="1" /> <edge from-layer="3674" from-port="2" to-layer="3676" to-port="0" /> <edge from-layer="3675" from-port="0" to-layer="3676" to-port="1" /> <edge from-layer="3676" from-port="2" to-layer="3677" to-port="0" /> <edge from-layer="3677" from-port="1" to-layer="3688" to-port="0" /> <edge from-layer="3678" from-port="0" to-layer="3679" to-port="0" /> <edge from-layer="3679" from-port="1" to-layer="3682" to-port="0" /> <edge from-layer="3680" from-port="0" to-layer="3681" to-port="0" /> <edge from-layer="3681" from-port="1" to-layer="3682" to-port="1" /> <edge from-layer="3682" from-port="2" to-layer="3684" to-port="0" /> <edge from-layer="3683" from-port="0" to-layer="3684" to-port="1" /> <edge from-layer="3684" from-port="2" to-layer="3686" to-port="0" /> <edge from-layer="3685" from-port="0" to-layer="3686" to-port="1" /> <edge from-layer="3686" from-port="2" to-layer="3687" to-port="0" /> <edge from-layer="3687" from-port="1" to-layer="3688" to-port="1" /> <edge from-layer="3688" from-port="2" to-layer="3690" to-port="0" /> <edge from-layer="3689" from-port="0" to-layer="3690" to-port="1" /> <edge from-layer="3690" from-port="2" to-layer="3691" to-port="1" /> <edge from-layer="3691" from-port="2" to-layer="3693" to-port="0" /> <edge from-layer="3691" from-port="2" to-layer="3785" to-port="0" /> <edge from-layer="3692" from-port="0" to-layer="3693" to-port="1" /> <edge from-layer="3693" from-port="2" to-layer="3695" to-port="0" /> <edge from-layer="3694" from-port="0" to-layer="3695" to-port="1" /> <edge from-layer="3695" from-port="2" to-layer="3697" to-port="0" /> <edge from-layer="3696" from-port="0" to-layer="3697" to-port="1" /> <edge from-layer="3697" from-port="2" to-layer="3708" to-port="0" /> <edge from-layer="3697" from-port="2" to-layer="3759" to-port="0" /> <edge from-layer="3697" from-port="2" to-layer="3734" to-port="0" /> <edge from-layer="3698" from-port="0" to-layer="3699" to-port="0" /> <edge from-layer="3699" from-port="1" to-layer="3702" to-port="0" /> <edge from-layer="3700" from-port="0" to-layer="3701" to-port="0" /> <edge from-layer="3701" from-port="1" to-layer="3702" to-port="1" /> <edge from-layer="3702" from-port="2" to-layer="3704" to-port="0" /> <edge from-layer="3703" from-port="0" to-layer="3704" to-port="1" /> <edge from-layer="3704" from-port="2" to-layer="3706" to-port="0" /> <edge from-layer="3705" from-port="0" to-layer="3706" to-port="1" /> <edge from-layer="3706" from-port="2" to-layer="3707" to-port="0" /> <edge from-layer="3707" from-port="1" to-layer="3708" to-port="1" /> <edge from-layer="3708" from-port="2" to-layer="3710" to-port="0" /> <edge from-layer="3709" from-port="0" to-layer="3710" to-port="1" /> <edge from-layer="3710" from-port="2" to-layer="3712" to-port="0" /> <edge from-layer="3711" from-port="0" to-layer="3712" to-port="1" /> <edge from-layer="3712" from-port="2" to-layer="3714" to-port="0" /> <edge from-layer="3713" from-port="0" to-layer="3714" to-port="1" /> <edge from-layer="3714" from-port="2" to-layer="3767" to-port="0" /> <edge from-layer="3715" from-port="0" to-layer="3720" to-port="0" /> <edge from-layer="3716" from-port="0" to-layer="3719" to-port="1" /> <edge from-layer="3717" from-port="0" to-layer="3719" to-port="2" /> <edge from-layer="3718" from-port="0" to-layer="3719" to-port="3" /> <edge from-layer="3719" from-port="4" to-layer="3720" to-port="1" /> <edge from-layer="3720" from-port="2" to-layer="3721" to-port="0" /> <edge from-layer="3721" from-port="1" to-layer="3723" to-port="0" /> <edge from-layer="3722" from-port="0" to-layer="3723" to-port="2" /> <edge from-layer="3723" from-port="3" to-layer="3739" to-port="0" /> <edge from-layer="3724" from-port="0" to-layer="3725" to-port="0" /> <edge from-layer="3725" from-port="1" to-layer="3728" to-port="0" /> <edge from-layer="3726" from-port="0" to-layer="3727" to-port="0" /> <edge from-layer="3727" from-port="1" to-layer="3728" to-port="1" /> <edge from-layer="3728" from-port="2" to-layer="3730" to-port="0" /> <edge from-layer="3729" from-port="0" to-layer="3730" to-port="1" /> <edge from-layer="3730" from-port="2" to-layer="3732" to-port="0" /> <edge from-layer="3731" from-port="0" to-layer="3732" to-port="1" /> <edge from-layer="3732" from-port="2" to-layer="3733" to-port="0" /> <edge from-layer="3733" from-port="1" to-layer="3734" to-port="1" /> <edge from-layer="3734" from-port="2" to-layer="3736" to-port="0" /> <edge from-layer="3735" from-port="0" to-layer="3736" to-port="1" /> <edge from-layer="3736" from-port="2" to-layer="3738" to-port="0" /> <edge from-layer="3737" from-port="0" to-layer="3738" to-port="1" /> <edge from-layer="3738" from-port="2" to-layer="3739" to-port="1" /> <edge from-layer="3739" from-port="2" to-layer="3767" to-port="1" /> <edge from-layer="3739" from-port="2" to-layer="4948" to-port="0" /> <edge from-layer="3740" from-port="0" to-layer="3745" to-port="0" /> <edge from-layer="3741" from-port="0" to-layer="3744" to-port="1" /> <edge from-layer="3742" from-port="0" to-layer="3744" to-port="2" /> <edge from-layer="3743" from-port="0" to-layer="3744" to-port="3" /> <edge from-layer="3744" from-port="4" to-layer="3745" to-port="1" /> <edge from-layer="3745" from-port="2" to-layer="3746" to-port="0" /> <edge from-layer="3746" from-port="1" to-layer="3748" to-port="0" /> <edge from-layer="3747" from-port="0" to-layer="3748" to-port="2" /> <edge from-layer="3748" from-port="3" to-layer="3766" to-port="0" /> <edge from-layer="3749" from-port="0" to-layer="3750" to-port="0" /> <edge from-layer="3750" from-port="1" to-layer="3753" to-port="0" /> <edge from-layer="3751" from-port="0" to-layer="3752" to-port="0" /> <edge from-layer="3752" from-port="1" to-layer="3753" to-port="1" /> <edge from-layer="3753" from-port="2" to-layer="3755" to-port="0" /> <edge from-layer="3754" from-port="0" to-layer="3755" to-port="1" /> <edge from-layer="3755" from-port="2" to-layer="3757" to-port="0" /> <edge from-layer="3756" from-port="0" to-layer="3757" to-port="1" /> <edge from-layer="3757" from-port="2" to-layer="3758" to-port="0" /> <edge from-layer="3758" from-port="1" to-layer="3759" to-port="1" /> <edge from-layer="3759" from-port="2" to-layer="3761" to-port="0" /> <edge from-layer="3760" from-port="0" to-layer="3761" to-port="1" /> <edge from-layer="3761" from-port="2" to-layer="3763" to-port="0" /> <edge from-layer="3762" from-port="0" to-layer="3763" to-port="1" /> <edge from-layer="3763" from-port="2" to-layer="3765" to-port="0" /> <edge from-layer="3764" from-port="0" to-layer="3765" to-port="1" /> <edge from-layer="3765" from-port="2" to-layer="3766" to-port="1" /> <edge from-layer="3766" from-port="2" to-layer="4947" to-port="0" /> <edge from-layer="3766" from-port="2" to-layer="3767" to-port="2" /> <edge from-layer="3767" from-port="4" to-layer="3769" to-port="0" /> <edge from-layer="3768" from-port="0" to-layer="3769" to-port="1" /> <edge from-layer="3769" from-port="2" to-layer="3771" to-port="0" /> <edge from-layer="3770" from-port="0" to-layer="3771" to-port="1" /> <edge from-layer="3771" from-port="2" to-layer="3782" to-port="0" /> <edge from-layer="3772" from-port="0" to-layer="3773" to-port="0" /> <edge from-layer="3773" from-port="1" to-layer="3776" to-port="0" /> <edge from-layer="3774" from-port="0" to-layer="3775" to-port="0" /> <edge from-layer="3775" from-port="1" to-layer="3776" to-port="1" /> <edge from-layer="3776" from-port="2" to-layer="3778" to-port="0" /> <edge from-layer="3777" from-port="0" to-layer="3778" to-port="1" /> <edge from-layer="3778" from-port="2" to-layer="3780" to-port="0" /> <edge from-layer="3779" from-port="0" to-layer="3780" to-port="1" /> <edge from-layer="3780" from-port="2" to-layer="3781" to-port="0" /> <edge from-layer="3781" from-port="1" to-layer="3782" to-port="1" /> <edge from-layer="3782" from-port="2" to-layer="3784" to-port="0" /> <edge from-layer="3783" from-port="0" to-layer="3784" to-port="1" /> <edge from-layer="3784" from-port="2" to-layer="3785" to-port="1" /> <edge from-layer="3785" from-port="2" to-layer="3787" to-port="0" /> <edge from-layer="3785" from-port="2" to-layer="3827" to-port="0" /> <edge from-layer="3786" from-port="0" to-layer="3787" to-port="1" /> <edge from-layer="3787" from-port="2" to-layer="3789" to-port="0" /> <edge from-layer="3788" from-port="0" to-layer="3789" to-port="1" /> <edge from-layer="3789" from-port="2" to-layer="3791" to-port="0" /> <edge from-layer="3790" from-port="0" to-layer="3791" to-port="1" /> <edge from-layer="3791" from-port="2" to-layer="3802" to-port="0" /> <edge from-layer="3792" from-port="0" to-layer="3793" to-port="0" /> <edge from-layer="3793" from-port="1" to-layer="3796" to-port="0" /> <edge from-layer="3794" from-port="0" to-layer="3795" to-port="0" /> <edge from-layer="3795" from-port="1" to-layer="3796" to-port="1" /> <edge from-layer="3796" from-port="2" to-layer="3798" to-port="0" /> <edge from-layer="3797" from-port="0" to-layer="3798" to-port="1" /> <edge from-layer="3798" from-port="2" to-layer="3800" to-port="0" /> <edge from-layer="3799" from-port="0" to-layer="3800" to-port="1" /> <edge from-layer="3800" from-port="2" to-layer="3801" to-port="0" /> <edge from-layer="3801" from-port="1" to-layer="3802" to-port="1" /> <edge from-layer="3802" from-port="2" to-layer="3804" to-port="0" /> <edge from-layer="3803" from-port="0" to-layer="3804" to-port="1" /> <edge from-layer="3804" from-port="2" to-layer="3806" to-port="0" /> <edge from-layer="3805" from-port="0" to-layer="3806" to-port="1" /> <edge from-layer="3806" from-port="2" to-layer="3808" to-port="0" /> <edge from-layer="3807" from-port="0" to-layer="3808" to-port="1" /> <edge from-layer="3808" from-port="2" to-layer="3809" to-port="0" /> <edge from-layer="3809" from-port="3" to-layer="3811" to-port="0" /> <edge from-layer="3810" from-port="0" to-layer="3811" to-port="1" /> <edge from-layer="3811" from-port="2" to-layer="3813" to-port="0" /> <edge from-layer="3812" from-port="0" to-layer="3813" to-port="1" /> <edge from-layer="3813" from-port="2" to-layer="3824" to-port="0" /> <edge from-layer="3814" from-port="0" to-layer="3815" to-port="0" /> <edge from-layer="3815" from-port="1" to-layer="3818" to-port="0" /> <edge from-layer="3816" from-port="0" to-layer="3817" to-port="0" /> <edge from-layer="3817" from-port="1" to-layer="3818" to-port="1" /> <edge from-layer="3818" from-port="2" to-layer="3820" to-port="0" /> <edge from-layer="3819" from-port="0" to-layer="3820" to-port="1" /> <edge from-layer="3820" from-port="2" to-layer="3822" to-port="0" /> <edge from-layer="3821" from-port="0" to-layer="3822" to-port="1" /> <edge from-layer="3822" from-port="2" to-layer="3823" to-port="0" /> <edge from-layer="3823" from-port="1" to-layer="3824" to-port="1" /> <edge from-layer="3824" from-port="2" to-layer="3826" to-port="0" /> <edge from-layer="3825" from-port="0" to-layer="3826" to-port="1" /> <edge from-layer="3826" from-port="2" to-layer="3827" to-port="1" /> <edge from-layer="3827" from-port="2" to-layer="3861" to-port="0" /> <edge from-layer="3827" from-port="2" to-layer="3829" to-port="0" /> <edge from-layer="3828" from-port="0" to-layer="3829" to-port="1" /> <edge from-layer="3829" from-port="2" to-layer="3831" to-port="0" /> <edge from-layer="3830" from-port="0" to-layer="3831" to-port="1" /> <edge from-layer="3831" from-port="2" to-layer="3833" to-port="0" /> <edge from-layer="3832" from-port="0" to-layer="3833" to-port="1" /> <edge from-layer="3833" from-port="2" to-layer="3844" to-port="0" /> <edge from-layer="3834" from-port="0" to-layer="3835" to-port="0" /> <edge from-layer="3835" from-port="1" to-layer="3838" to-port="0" /> <edge from-layer="3836" from-port="0" to-layer="3837" to-port="0" /> <edge from-layer="3837" from-port="1" to-layer="3838" to-port="1" /> <edge from-layer="3838" from-port="2" to-layer="3840" to-port="0" /> <edge from-layer="3839" from-port="0" to-layer="3840" to-port="1" /> <edge from-layer="3840" from-port="2" to-layer="3842" to-port="0" /> <edge from-layer="3841" from-port="0" to-layer="3842" to-port="1" /> <edge from-layer="3842" from-port="2" to-layer="3843" to-port="0" /> <edge from-layer="3843" from-port="1" to-layer="3844" to-port="1" /> <edge from-layer="3844" from-port="2" to-layer="3846" to-port="0" /> <edge from-layer="3845" from-port="0" to-layer="3846" to-port="1" /> <edge from-layer="3846" from-port="2" to-layer="3847" to-port="0" /> <edge from-layer="3847" from-port="1" to-layer="3858" to-port="0" /> <edge from-layer="3848" from-port="0" to-layer="3849" to-port="0" /> <edge from-layer="3849" from-port="1" to-layer="3852" to-port="0" /> <edge from-layer="3850" from-port="0" to-layer="3851" to-port="0" /> <edge from-layer="3851" from-port="1" to-layer="3852" to-port="1" /> <edge from-layer="3852" from-port="2" to-layer="3854" to-port="0" /> <edge from-layer="3853" from-port="0" to-layer="3854" to-port="1" /> <edge from-layer="3854" from-port="2" to-layer="3856" to-port="0" /> <edge from-layer="3855" from-port="0" to-layer="3856" to-port="1" /> <edge from-layer="3856" from-port="2" to-layer="3857" to-port="0" /> <edge from-layer="3857" from-port="1" to-layer="3858" to-port="1" /> <edge from-layer="3858" from-port="2" to-layer="3860" to-port="0" /> <edge from-layer="3859" from-port="0" to-layer="3860" to-port="1" /> <edge from-layer="3860" from-port="2" to-layer="3861" to-port="1" /> <edge from-layer="3861" from-port="2" to-layer="3955" to-port="0" /> <edge from-layer="3861" from-port="2" to-layer="3863" to-port="0" /> <edge from-layer="3862" from-port="0" to-layer="3863" to-port="1" /> <edge from-layer="3863" from-port="2" to-layer="3865" to-port="0" /> <edge from-layer="3864" from-port="0" to-layer="3865" to-port="1" /> <edge from-layer="3865" from-port="2" to-layer="3867" to-port="0" /> <edge from-layer="3866" from-port="0" to-layer="3867" to-port="1" /> <edge from-layer="3867" from-port="2" to-layer="3904" to-port="0" /> <edge from-layer="3867" from-port="2" to-layer="3929" to-port="0" /> <edge from-layer="3867" from-port="2" to-layer="3878" to-port="0" /> <edge from-layer="3868" from-port="0" to-layer="3869" to-port="0" /> <edge from-layer="3869" from-port="1" to-layer="3872" to-port="0" /> <edge from-layer="3870" from-port="0" to-layer="3871" to-port="0" /> <edge from-layer="3871" from-port="1" to-layer="3872" to-port="1" /> <edge from-layer="3872" from-port="2" to-layer="3874" to-port="0" /> <edge from-layer="3873" from-port="0" to-layer="3874" to-port="1" /> <edge from-layer="3874" from-port="2" to-layer="3876" to-port="0" /> <edge from-layer="3875" from-port="0" to-layer="3876" to-port="1" /> <edge from-layer="3876" from-port="2" to-layer="3877" to-port="0" /> <edge from-layer="3877" from-port="1" to-layer="3878" to-port="1" /> <edge from-layer="3878" from-port="2" to-layer="3880" to-port="0" /> <edge from-layer="3879" from-port="0" to-layer="3880" to-port="1" /> <edge from-layer="3880" from-port="2" to-layer="3882" to-port="0" /> <edge from-layer="3881" from-port="0" to-layer="3882" to-port="1" /> <edge from-layer="3882" from-port="2" to-layer="3884" to-port="0" /> <edge from-layer="3883" from-port="0" to-layer="3884" to-port="1" /> <edge from-layer="3884" from-port="2" to-layer="3937" to-port="0" /> <edge from-layer="3885" from-port="0" to-layer="3890" to-port="0" /> <edge from-layer="3886" from-port="0" to-layer="3889" to-port="1" /> <edge from-layer="3887" from-port="0" to-layer="3889" to-port="2" /> <edge from-layer="3888" from-port="0" to-layer="3889" to-port="3" /> <edge from-layer="3889" from-port="4" to-layer="3890" to-port="1" /> <edge from-layer="3890" from-port="2" to-layer="3891" to-port="0" /> <edge from-layer="3891" from-port="1" to-layer="3893" to-port="0" /> <edge from-layer="3892" from-port="0" to-layer="3893" to-port="2" /> <edge from-layer="3893" from-port="3" to-layer="3909" to-port="0" /> <edge from-layer="3894" from-port="0" to-layer="3895" to-port="0" /> <edge from-layer="3895" from-port="1" to-layer="3898" to-port="0" /> <edge from-layer="3896" from-port="0" to-layer="3897" to-port="0" /> <edge from-layer="3897" from-port="1" to-layer="3898" to-port="1" /> <edge from-layer="3898" from-port="2" to-layer="3900" to-port="0" /> <edge from-layer="3899" from-port="0" to-layer="3900" to-port="1" /> <edge from-layer="3900" from-port="2" to-layer="3902" to-port="0" /> <edge from-layer="3901" from-port="0" to-layer="3902" to-port="1" /> <edge from-layer="3902" from-port="2" to-layer="3903" to-port="0" /> <edge from-layer="3903" from-port="1" to-layer="3904" to-port="1" /> <edge from-layer="3904" from-port="2" to-layer="3906" to-port="0" /> <edge from-layer="3905" from-port="0" to-layer="3906" to-port="1" /> <edge from-layer="3906" from-port="2" to-layer="3908" to-port="0" /> <edge from-layer="3907" from-port="0" to-layer="3908" to-port="1" /> <edge from-layer="3908" from-port="2" to-layer="3909" to-port="1" /> <edge from-layer="3909" from-port="2" to-layer="3937" to-port="1" /> <edge from-layer="3909" from-port="2" to-layer="4946" to-port="0" /> <edge from-layer="3910" from-port="0" to-layer="3915" to-port="0" /> <edge from-layer="3911" from-port="0" to-layer="3914" to-port="1" /> <edge from-layer="3912" from-port="0" to-layer="3914" to-port="2" /> <edge from-layer="3913" from-port="0" to-layer="3914" to-port="3" /> <edge from-layer="3914" from-port="4" to-layer="3915" to-port="1" /> <edge from-layer="3915" from-port="2" to-layer="3916" to-port="0" /> <edge from-layer="3916" from-port="1" to-layer="3918" to-port="0" /> <edge from-layer="3917" from-port="0" to-layer="3918" to-port="2" /> <edge from-layer="3918" from-port="3" to-layer="3936" to-port="0" /> <edge from-layer="3919" from-port="0" to-layer="3920" to-port="0" /> <edge from-layer="3920" from-port="1" to-layer="3923" to-port="0" /> <edge from-layer="3921" from-port="0" to-layer="3922" to-port="0" /> <edge from-layer="3922" from-port="1" to-layer="3923" to-port="1" /> <edge from-layer="3923" from-port="2" to-layer="3925" to-port="0" /> <edge from-layer="3924" from-port="0" to-layer="3925" to-port="1" /> <edge from-layer="3925" from-port="2" to-layer="3927" to-port="0" /> <edge from-layer="3926" from-port="0" to-layer="3927" to-port="1" /> <edge from-layer="3927" from-port="2" to-layer="3928" to-port="0" /> <edge from-layer="3928" from-port="1" to-layer="3929" to-port="1" /> <edge from-layer="3929" from-port="2" to-layer="3931" to-port="0" /> <edge from-layer="3930" from-port="0" to-layer="3931" to-port="1" /> <edge from-layer="3931" from-port="2" to-layer="3933" to-port="0" /> <edge from-layer="3932" from-port="0" to-layer="3933" to-port="1" /> <edge from-layer="3933" from-port="2" to-layer="3935" to-port="0" /> <edge from-layer="3934" from-port="0" to-layer="3935" to-port="1" /> <edge from-layer="3935" from-port="2" to-layer="3936" to-port="1" /> <edge from-layer="3936" from-port="2" to-layer="3937" to-port="2" /> <edge from-layer="3936" from-port="2" to-layer="4945" to-port="0" /> <edge from-layer="3937" from-port="4" to-layer="3939" to-port="0" /> <edge from-layer="3938" from-port="0" to-layer="3939" to-port="1" /> <edge from-layer="3939" from-port="2" to-layer="3941" to-port="0" /> <edge from-layer="3940" from-port="0" to-layer="3941" to-port="1" /> <edge from-layer="3941" from-port="2" to-layer="3952" to-port="0" /> <edge from-layer="3942" from-port="0" to-layer="3943" to-port="0" /> <edge from-layer="3943" from-port="1" to-layer="3946" to-port="0" /> <edge from-layer="3944" from-port="0" to-layer="3945" to-port="0" /> <edge from-layer="3945" from-port="1" to-layer="3946" to-port="1" /> <edge from-layer="3946" from-port="2" to-layer="3948" to-port="0" /> <edge from-layer="3947" from-port="0" to-layer="3948" to-port="1" /> <edge from-layer="3948" from-port="2" to-layer="3950" to-port="0" /> <edge from-layer="3949" from-port="0" to-layer="3950" to-port="1" /> <edge from-layer="3950" from-port="2" to-layer="3951" to-port="0" /> <edge from-layer="3951" from-port="1" to-layer="3952" to-port="1" /> <edge from-layer="3952" from-port="2" to-layer="3954" to-port="0" /> <edge from-layer="3953" from-port="0" to-layer="3954" to-port="1" /> <edge from-layer="3954" from-port="2" to-layer="3955" to-port="1" /> <edge from-layer="3955" from-port="2" to-layer="3997" to-port="0" /> <edge from-layer="3955" from-port="2" to-layer="3957" to-port="0" /> <edge from-layer="3956" from-port="0" to-layer="3957" to-port="1" /> <edge from-layer="3957" from-port="2" to-layer="3959" to-port="0" /> <edge from-layer="3958" from-port="0" to-layer="3959" to-port="1" /> <edge from-layer="3959" from-port="2" to-layer="3961" to-port="0" /> <edge from-layer="3960" from-port="0" to-layer="3961" to-port="1" /> <edge from-layer="3961" from-port="2" to-layer="3972" to-port="0" /> <edge from-layer="3962" from-port="0" to-layer="3963" to-port="0" /> <edge from-layer="3963" from-port="1" to-layer="3966" to-port="0" /> <edge from-layer="3964" from-port="0" to-layer="3965" to-port="0" /> <edge from-layer="3965" from-port="1" to-layer="3966" to-port="1" /> <edge from-layer="3966" from-port="2" to-layer="3968" to-port="0" /> <edge from-layer="3967" from-port="0" to-layer="3968" to-port="1" /> <edge from-layer="3968" from-port="2" to-layer="3970" to-port="0" /> <edge from-layer="3969" from-port="0" to-layer="3970" to-port="1" /> <edge from-layer="3970" from-port="2" to-layer="3971" to-port="0" /> <edge from-layer="3971" from-port="1" to-layer="3972" to-port="1" /> <edge from-layer="3972" from-port="2" to-layer="3974" to-port="0" /> <edge from-layer="3973" from-port="0" to-layer="3974" to-port="1" /> <edge from-layer="3974" from-port="2" to-layer="3976" to-port="0" /> <edge from-layer="3975" from-port="0" to-layer="3976" to-port="1" /> <edge from-layer="3976" from-port="2" to-layer="3978" to-port="0" /> <edge from-layer="3977" from-port="0" to-layer="3978" to-port="1" /> <edge from-layer="3978" from-port="2" to-layer="3979" to-port="0" /> <edge from-layer="3979" from-port="3" to-layer="3981" to-port="0" /> <edge from-layer="3980" from-port="0" to-layer="3981" to-port="1" /> <edge from-layer="3981" from-port="2" to-layer="3983" to-port="0" /> <edge from-layer="3982" from-port="0" to-layer="3983" to-port="1" /> <edge from-layer="3983" from-port="2" to-layer="3994" to-port="0" /> <edge from-layer="3984" from-port="0" to-layer="3985" to-port="0" /> <edge from-layer="3985" from-port="1" to-layer="3988" to-port="0" /> <edge from-layer="3986" from-port="0" to-layer="3987" to-port="0" /> <edge from-layer="3987" from-port="1" to-layer="3988" to-port="1" /> <edge from-layer="3988" from-port="2" to-layer="3990" to-port="0" /> <edge from-layer="3989" from-port="0" to-layer="3990" to-port="1" /> <edge from-layer="3990" from-port="2" to-layer="3992" to-port="0" /> <edge from-layer="3991" from-port="0" to-layer="3992" to-port="1" /> <edge from-layer="3992" from-port="2" to-layer="3993" to-port="0" /> <edge from-layer="3993" from-port="1" to-layer="3994" to-port="1" /> <edge from-layer="3994" from-port="2" to-layer="3996" to-port="0" /> <edge from-layer="3995" from-port="0" to-layer="3996" to-port="1" /> <edge from-layer="3996" from-port="2" to-layer="3997" to-port="1" /> <edge from-layer="3997" from-port="2" to-layer="4031" to-port="0" /> <edge from-layer="3997" from-port="2" to-layer="3999" to-port="0" /> <edge from-layer="3998" from-port="0" to-layer="3999" to-port="1" /> <edge from-layer="3999" from-port="2" to-layer="4001" to-port="0" /> <edge from-layer="4000" from-port="0" to-layer="4001" to-port="1" /> <edge from-layer="4001" from-port="2" to-layer="4003" to-port="0" /> <edge from-layer="4002" from-port="0" to-layer="4003" to-port="1" /> <edge from-layer="4003" from-port="2" to-layer="4014" to-port="0" /> <edge from-layer="4004" from-port="0" to-layer="4005" to-port="0" /> <edge from-layer="4005" from-port="1" to-layer="4008" to-port="0" /> <edge from-layer="4006" from-port="0" to-layer="4007" to-port="0" /> <edge from-layer="4007" from-port="1" to-layer="4008" to-port="1" /> <edge from-layer="4008" from-port="2" to-layer="4010" to-port="0" /> <edge from-layer="4009" from-port="0" to-layer="4010" to-port="1" /> <edge from-layer="4010" from-port="2" to-layer="4012" to-port="0" /> <edge from-layer="4011" from-port="0" to-layer="4012" to-port="1" /> <edge from-layer="4012" from-port="2" to-layer="4013" to-port="0" /> <edge from-layer="4013" from-port="1" to-layer="4014" to-port="1" /> <edge from-layer="4014" from-port="2" to-layer="4016" to-port="0" /> <edge from-layer="4015" from-port="0" to-layer="4016" to-port="1" /> <edge from-layer="4016" from-port="2" to-layer="4017" to-port="0" /> <edge from-layer="4017" from-port="1" to-layer="4028" to-port="0" /> <edge from-layer="4018" from-port="0" to-layer="4019" to-port="0" /> <edge from-layer="4019" from-port="1" to-layer="4022" to-port="0" /> <edge from-layer="4020" from-port="0" to-layer="4021" to-port="0" /> <edge from-layer="4021" from-port="1" to-layer="4022" to-port="1" /> <edge from-layer="4022" from-port="2" to-layer="4024" to-port="0" /> <edge from-layer="4023" from-port="0" to-layer="4024" to-port="1" /> <edge from-layer="4024" from-port="2" to-layer="4026" to-port="0" /> <edge from-layer="4025" from-port="0" to-layer="4026" to-port="1" /> <edge from-layer="4026" from-port="2" to-layer="4027" to-port="0" /> <edge from-layer="4027" from-port="1" to-layer="4028" to-port="1" /> <edge from-layer="4028" from-port="2" to-layer="4030" to-port="0" /> <edge from-layer="4029" from-port="0" to-layer="4030" to-port="1" /> <edge from-layer="4030" from-port="2" to-layer="4031" to-port="1" /> <edge from-layer="4031" from-port="2" to-layer="4033" to-port="0" /> <edge from-layer="4031" from-port="2" to-layer="4125" to-port="0" /> <edge from-layer="4032" from-port="0" to-layer="4033" to-port="1" /> <edge from-layer="4033" from-port="2" to-layer="4035" to-port="0" /> <edge from-layer="4034" from-port="0" to-layer="4035" to-port="1" /> <edge from-layer="4035" from-port="2" to-layer="4037" to-port="0" /> <edge from-layer="4036" from-port="0" to-layer="4037" to-port="1" /> <edge from-layer="4037" from-port="2" to-layer="4048" to-port="0" /> <edge from-layer="4037" from-port="2" to-layer="4074" to-port="0" /> <edge from-layer="4037" from-port="2" to-layer="4099" to-port="0" /> <edge from-layer="4038" from-port="0" to-layer="4039" to-port="0" /> <edge from-layer="4039" from-port="1" to-layer="4042" to-port="0" /> <edge from-layer="4040" from-port="0" to-layer="4041" to-port="0" /> <edge from-layer="4041" from-port="1" to-layer="4042" to-port="1" /> <edge from-layer="4042" from-port="2" to-layer="4044" to-port="0" /> <edge from-layer="4043" from-port="0" to-layer="4044" to-port="1" /> <edge from-layer="4044" from-port="2" to-layer="4046" to-port="0" /> <edge from-layer="4045" from-port="0" to-layer="4046" to-port="1" /> <edge from-layer="4046" from-port="2" to-layer="4047" to-port="0" /> <edge from-layer="4047" from-port="1" to-layer="4048" to-port="1" /> <edge from-layer="4048" from-port="2" to-layer="4050" to-port="0" /> <edge from-layer="4049" from-port="0" to-layer="4050" to-port="1" /> <edge from-layer="4050" from-port="2" to-layer="4052" to-port="0" /> <edge from-layer="4051" from-port="0" to-layer="4052" to-port="1" /> <edge from-layer="4052" from-port="2" to-layer="4054" to-port="0" /> <edge from-layer="4053" from-port="0" to-layer="4054" to-port="1" /> <edge from-layer="4054" from-port="2" to-layer="4107" to-port="0" /> <edge from-layer="4055" from-port="0" to-layer="4060" to-port="0" /> <edge from-layer="4056" from-port="0" to-layer="4059" to-port="1" /> <edge from-layer="4057" from-port="0" to-layer="4059" to-port="2" /> <edge from-layer="4058" from-port="0" to-layer="4059" to-port="3" /> <edge from-layer="4059" from-port="4" to-layer="4060" to-port="1" /> <edge from-layer="4060" from-port="2" to-layer="4061" to-port="0" /> <edge from-layer="4061" from-port="1" to-layer="4063" to-port="0" /> <edge from-layer="4062" from-port="0" to-layer="4063" to-port="2" /> <edge from-layer="4063" from-port="3" to-layer="4079" to-port="0" /> <edge from-layer="4064" from-port="0" to-layer="4065" to-port="0" /> <edge from-layer="4065" from-port="1" to-layer="4068" to-port="0" /> <edge from-layer="4066" from-port="0" to-layer="4067" to-port="0" /> <edge from-layer="4067" from-port="1" to-layer="4068" to-port="1" /> <edge from-layer="4068" from-port="2" to-layer="4070" to-port="0" /> <edge from-layer="4069" from-port="0" to-layer="4070" to-port="1" /> <edge from-layer="4070" from-port="2" to-layer="4072" to-port="0" /> <edge from-layer="4071" from-port="0" to-layer="4072" to-port="1" /> <edge from-layer="4072" from-port="2" to-layer="4073" to-port="0" /> <edge from-layer="4073" from-port="1" to-layer="4074" to-port="1" /> <edge from-layer="4074" from-port="2" to-layer="4076" to-port="0" /> <edge from-layer="4075" from-port="0" to-layer="4076" to-port="1" /> <edge from-layer="4076" from-port="2" to-layer="4078" to-port="0" /> <edge from-layer="4077" from-port="0" to-layer="4078" to-port="1" /> <edge from-layer="4078" from-port="2" to-layer="4079" to-port="1" /> <edge from-layer="4079" from-port="2" to-layer="4944" to-port="0" /> <edge from-layer="4079" from-port="2" to-layer="4107" to-port="1" /> <edge from-layer="4080" from-port="0" to-layer="4085" to-port="0" /> <edge from-layer="4081" from-port="0" to-layer="4084" to-port="1" /> <edge from-layer="4082" from-port="0" to-layer="4084" to-port="2" /> <edge from-layer="4083" from-port="0" to-layer="4084" to-port="3" /> <edge from-layer="4084" from-port="4" to-layer="4085" to-port="1" /> <edge from-layer="4085" from-port="2" to-layer="4086" to-port="0" /> <edge from-layer="4086" from-port="1" to-layer="4088" to-port="0" /> <edge from-layer="4087" from-port="0" to-layer="4088" to-port="2" /> <edge from-layer="4088" from-port="3" to-layer="4106" to-port="0" /> <edge from-layer="4089" from-port="0" to-layer="4090" to-port="0" /> <edge from-layer="4090" from-port="1" to-layer="4093" to-port="0" /> <edge from-layer="4091" from-port="0" to-layer="4092" to-port="0" /> <edge from-layer="4092" from-port="1" to-layer="4093" to-port="1" /> <edge from-layer="4093" from-port="2" to-layer="4095" to-port="0" /> <edge from-layer="4094" from-port="0" to-layer="4095" to-port="1" /> <edge from-layer="4095" from-port="2" to-layer="4097" to-port="0" /> <edge from-layer="4096" from-port="0" to-layer="4097" to-port="1" /> <edge from-layer="4097" from-port="2" to-layer="4098" to-port="0" /> <edge from-layer="4098" from-port="1" to-layer="4099" to-port="1" /> <edge from-layer="4099" from-port="2" to-layer="4101" to-port="0" /> <edge from-layer="4100" from-port="0" to-layer="4101" to-port="1" /> <edge from-layer="4101" from-port="2" to-layer="4103" to-port="0" /> <edge from-layer="4102" from-port="0" to-layer="4103" to-port="1" /> <edge from-layer="4103" from-port="2" to-layer="4105" to-port="0" /> <edge from-layer="4104" from-port="0" to-layer="4105" to-port="1" /> <edge from-layer="4105" from-port="2" to-layer="4106" to-port="1" /> <edge from-layer="4106" from-port="2" to-layer="4107" to-port="2" /> <edge from-layer="4106" from-port="2" to-layer="4943" to-port="0" /> <edge from-layer="4107" from-port="4" to-layer="4109" to-port="0" /> <edge from-layer="4108" from-port="0" to-layer="4109" to-port="1" /> <edge from-layer="4109" from-port="2" to-layer="4111" to-port="0" /> <edge from-layer="4110" from-port="0" to-layer="4111" to-port="1" /> <edge from-layer="4111" from-port="2" to-layer="4122" to-port="0" /> <edge from-layer="4112" from-port="0" to-layer="4113" to-port="0" /> <edge from-layer="4113" from-port="1" to-layer="4116" to-port="0" /> <edge from-layer="4114" from-port="0" to-layer="4115" to-port="0" /> <edge from-layer="4115" from-port="1" to-layer="4116" to-port="1" /> <edge from-layer="4116" from-port="2" to-layer="4118" to-port="0" /> <edge from-layer="4117" from-port="0" to-layer="4118" to-port="1" /> <edge from-layer="4118" from-port="2" to-layer="4120" to-port="0" /> <edge from-layer="4119" from-port="0" to-layer="4120" to-port="1" /> <edge from-layer="4120" from-port="2" to-layer="4121" to-port="0" /> <edge from-layer="4121" from-port="1" to-layer="4122" to-port="1" /> <edge from-layer="4122" from-port="2" to-layer="4124" to-port="0" /> <edge from-layer="4123" from-port="0" to-layer="4124" to-port="1" /> <edge from-layer="4124" from-port="2" to-layer="4125" to-port="1" /> <edge from-layer="4125" from-port="2" to-layer="4127" to-port="0" /> <edge from-layer="4125" from-port="2" to-layer="4167" to-port="0" /> <edge from-layer="4126" from-port="0" to-layer="4127" to-port="1" /> <edge from-layer="4127" from-port="2" to-layer="4129" to-port="0" /> <edge from-layer="4128" from-port="0" to-layer="4129" to-port="1" /> <edge from-layer="4129" from-port="2" to-layer="4131" to-port="0" /> <edge from-layer="4130" from-port="0" to-layer="4131" to-port="1" /> <edge from-layer="4131" from-port="2" to-layer="4142" to-port="0" /> <edge from-layer="4132" from-port="0" to-layer="4133" to-port="0" /> <edge from-layer="4133" from-port="1" to-layer="4136" to-port="0" /> <edge from-layer="4134" from-port="0" to-layer="4135" to-port="0" /> <edge from-layer="4135" from-port="1" to-layer="4136" to-port="1" /> <edge from-layer="4136" from-port="2" to-layer="4138" to-port="0" /> <edge from-layer="4137" from-port="0" to-layer="4138" to-port="1" /> <edge from-layer="4138" from-port="2" to-layer="4140" to-port="0" /> <edge from-layer="4139" from-port="0" to-layer="4140" to-port="1" /> <edge from-layer="4140" from-port="2" to-layer="4141" to-port="0" /> <edge from-layer="4141" from-port="1" to-layer="4142" to-port="1" /> <edge from-layer="4142" from-port="2" to-layer="4144" to-port="0" /> <edge from-layer="4143" from-port="0" to-layer="4144" to-port="1" /> <edge from-layer="4144" from-port="2" to-layer="4146" to-port="0" /> <edge from-layer="4145" from-port="0" to-layer="4146" to-port="1" /> <edge from-layer="4146" from-port="2" to-layer="4148" to-port="0" /> <edge from-layer="4147" from-port="0" to-layer="4148" to-port="1" /> <edge from-layer="4148" from-port="2" to-layer="4149" to-port="0" /> <edge from-layer="4149" from-port="3" to-layer="4151" to-port="0" /> <edge from-layer="4150" from-port="0" to-layer="4151" to-port="1" /> <edge from-layer="4151" from-port="2" to-layer="4153" to-port="0" /> <edge from-layer="4152" from-port="0" to-layer="4153" to-port="1" /> <edge from-layer="4153" from-port="2" to-layer="4164" to-port="0" /> <edge from-layer="4154" from-port="0" to-layer="4155" to-port="0" /> <edge from-layer="4155" from-port="1" to-layer="4158" to-port="0" /> <edge from-layer="4156" from-port="0" to-layer="4157" to-port="0" /> <edge from-layer="4157" from-port="1" to-layer="4158" to-port="1" /> <edge from-layer="4158" from-port="2" to-layer="4160" to-port="0" /> <edge from-layer="4159" from-port="0" to-layer="4160" to-port="1" /> <edge from-layer="4160" from-port="2" to-layer="4162" to-port="0" /> <edge from-layer="4161" from-port="0" to-layer="4162" to-port="1" /> <edge from-layer="4162" from-port="2" to-layer="4163" to-port="0" /> <edge from-layer="4163" from-port="1" to-layer="4164" to-port="1" /> <edge from-layer="4164" from-port="2" to-layer="4166" to-port="0" /> <edge from-layer="4165" from-port="0" to-layer="4166" to-port="1" /> <edge from-layer="4166" from-port="2" to-layer="4167" to-port="1" /> <edge from-layer="4167" from-port="2" to-layer="4201" to-port="0" /> <edge from-layer="4167" from-port="2" to-layer="4169" to-port="0" /> <edge from-layer="4168" from-port="0" to-layer="4169" to-port="1" /> <edge from-layer="4169" from-port="2" to-layer="4171" to-port="0" /> <edge from-layer="4170" from-port="0" to-layer="4171" to-port="1" /> <edge from-layer="4171" from-port="2" to-layer="4173" to-port="0" /> <edge from-layer="4172" from-port="0" to-layer="4173" to-port="1" /> <edge from-layer="4173" from-port="2" to-layer="4184" to-port="0" /> <edge from-layer="4174" from-port="0" to-layer="4175" to-port="0" /> <edge from-layer="4175" from-port="1" to-layer="4178" to-port="0" /> <edge from-layer="4176" from-port="0" to-layer="4177" to-port="0" /> <edge from-layer="4177" from-port="1" to-layer="4178" to-port="1" /> <edge from-layer="4178" from-port="2" to-layer="4180" to-port="0" /> <edge from-layer="4179" from-port="0" to-layer="4180" to-port="1" /> <edge from-layer="4180" from-port="2" to-layer="4182" to-port="0" /> <edge from-layer="4181" from-port="0" to-layer="4182" to-port="1" /> <edge from-layer="4182" from-port="2" to-layer="4183" to-port="0" /> <edge from-layer="4183" from-port="1" to-layer="4184" to-port="1" /> <edge from-layer="4184" from-port="2" to-layer="4186" to-port="0" /> <edge from-layer="4185" from-port="0" to-layer="4186" to-port="1" /> <edge from-layer="4186" from-port="2" to-layer="4187" to-port="0" /> <edge from-layer="4187" from-port="1" to-layer="4198" to-port="0" /> <edge from-layer="4188" from-port="0" to-layer="4189" to-port="0" /> <edge from-layer="4189" from-port="1" to-layer="4192" to-port="0" /> <edge from-layer="4190" from-port="0" to-layer="4191" to-port="0" /> <edge from-layer="4191" from-port="1" to-layer="4192" to-port="1" /> <edge from-layer="4192" from-port="2" to-layer="4194" to-port="0" /> <edge from-layer="4193" from-port="0" to-layer="4194" to-port="1" /> <edge from-layer="4194" from-port="2" to-layer="4196" to-port="0" /> <edge from-layer="4195" from-port="0" to-layer="4196" to-port="1" /> <edge from-layer="4196" from-port="2" to-layer="4197" to-port="0" /> <edge from-layer="4197" from-port="1" to-layer="4198" to-port="1" /> <edge from-layer="4198" from-port="2" to-layer="4200" to-port="0" /> <edge from-layer="4199" from-port="0" to-layer="4200" to-port="1" /> <edge from-layer="4200" from-port="2" to-layer="4201" to-port="1" /> <edge from-layer="4201" from-port="2" to-layer="4295" to-port="0" /> <edge from-layer="4201" from-port="2" to-layer="4203" to-port="0" /> <edge from-layer="4202" from-port="0" to-layer="4203" to-port="1" /> <edge from-layer="4203" from-port="2" to-layer="4205" to-port="0" /> <edge from-layer="4204" from-port="0" to-layer="4205" to-port="1" /> <edge from-layer="4205" from-port="2" to-layer="4207" to-port="0" /> <edge from-layer="4206" from-port="0" to-layer="4207" to-port="1" /> <edge from-layer="4207" from-port="2" to-layer="4244" to-port="0" /> <edge from-layer="4207" from-port="2" to-layer="4218" to-port="0" /> <edge from-layer="4207" from-port="2" to-layer="4269" to-port="0" /> <edge from-layer="4208" from-port="0" to-layer="4209" to-port="0" /> <edge from-layer="4209" from-port="1" to-layer="4212" to-port="0" /> <edge from-layer="4210" from-port="0" to-layer="4211" to-port="0" /> <edge from-layer="4211" from-port="1" to-layer="4212" to-port="1" /> <edge from-layer="4212" from-port="2" to-layer="4214" to-port="0" /> <edge from-layer="4213" from-port="0" to-layer="4214" to-port="1" /> <edge from-layer="4214" from-port="2" to-layer="4216" to-port="0" /> <edge from-layer="4215" from-port="0" to-layer="4216" to-port="1" /> <edge from-layer="4216" from-port="2" to-layer="4217" to-port="0" /> <edge from-layer="4217" from-port="1" to-layer="4218" to-port="1" /> <edge from-layer="4218" from-port="2" to-layer="4220" to-port="0" /> <edge from-layer="4219" from-port="0" to-layer="4220" to-port="1" /> <edge from-layer="4220" from-port="2" to-layer="4222" to-port="0" /> <edge from-layer="4221" from-port="0" to-layer="4222" to-port="1" /> <edge from-layer="4222" from-port="2" to-layer="4224" to-port="0" /> <edge from-layer="4223" from-port="0" to-layer="4224" to-port="1" /> <edge from-layer="4224" from-port="2" to-layer="4277" to-port="0" /> <edge from-layer="4225" from-port="0" to-layer="4230" to-port="0" /> <edge from-layer="4226" from-port="0" to-layer="4229" to-port="1" /> <edge from-layer="4227" from-port="0" to-layer="4229" to-port="2" /> <edge from-layer="4228" from-port="0" to-layer="4229" to-port="3" /> <edge from-layer="4229" from-port="4" to-layer="4230" to-port="1" /> <edge from-layer="4230" from-port="2" to-layer="4231" to-port="0" /> <edge from-layer="4231" from-port="1" to-layer="4233" to-port="0" /> <edge from-layer="4232" from-port="0" to-layer="4233" to-port="2" /> <edge from-layer="4233" from-port="3" to-layer="4249" to-port="0" /> <edge from-layer="4234" from-port="0" to-layer="4235" to-port="0" /> <edge from-layer="4235" from-port="1" to-layer="4238" to-port="0" /> <edge from-layer="4236" from-port="0" to-layer="4237" to-port="0" /> <edge from-layer="4237" from-port="1" to-layer="4238" to-port="1" /> <edge from-layer="4238" from-port="2" to-layer="4240" to-port="0" /> <edge from-layer="4239" from-port="0" to-layer="4240" to-port="1" /> <edge from-layer="4240" from-port="2" to-layer="4242" to-port="0" /> <edge from-layer="4241" from-port="0" to-layer="4242" to-port="1" /> <edge from-layer="4242" from-port="2" to-layer="4243" to-port="0" /> <edge from-layer="4243" from-port="1" to-layer="4244" to-port="1" /> <edge from-layer="4244" from-port="2" to-layer="4246" to-port="0" /> <edge from-layer="4245" from-port="0" to-layer="4246" to-port="1" /> <edge from-layer="4246" from-port="2" to-layer="4248" to-port="0" /> <edge from-layer="4247" from-port="0" to-layer="4248" to-port="1" /> <edge from-layer="4248" from-port="2" to-layer="4249" to-port="1" /> <edge from-layer="4249" from-port="2" to-layer="4277" to-port="1" /> <edge from-layer="4249" from-port="2" to-layer="4942" to-port="0" /> <edge from-layer="4250" from-port="0" to-layer="4255" to-port="0" /> <edge from-layer="4251" from-port="0" to-layer="4254" to-port="1" /> <edge from-layer="4252" from-port="0" to-layer="4254" to-port="2" /> <edge from-layer="4253" from-port="0" to-layer="4254" to-port="3" /> <edge from-layer="4254" from-port="4" to-layer="4255" to-port="1" /> <edge from-layer="4255" from-port="2" to-layer="4256" to-port="0" /> <edge from-layer="4256" from-port="1" to-layer="4258" to-port="0" /> <edge from-layer="4257" from-port="0" to-layer="4258" to-port="2" /> <edge from-layer="4258" from-port="3" to-layer="4276" to-port="0" /> <edge from-layer="4259" from-port="0" to-layer="4260" to-port="0" /> <edge from-layer="4260" from-port="1" to-layer="4263" to-port="0" /> <edge from-layer="4261" from-port="0" to-layer="4262" to-port="0" /> <edge from-layer="4262" from-port="1" to-layer="4263" to-port="1" /> <edge from-layer="4263" from-port="2" to-layer="4265" to-port="0" /> <edge from-layer="4264" from-port="0" to-layer="4265" to-port="1" /> <edge from-layer="4265" from-port="2" to-layer="4267" to-port="0" /> <edge from-layer="4266" from-port="0" to-layer="4267" to-port="1" /> <edge from-layer="4267" from-port="2" to-layer="4268" to-port="0" /> <edge from-layer="4268" from-port="1" to-layer="4269" to-port="1" /> <edge from-layer="4269" from-port="2" to-layer="4271" to-port="0" /> <edge from-layer="4270" from-port="0" to-layer="4271" to-port="1" /> <edge from-layer="4271" from-port="2" to-layer="4273" to-port="0" /> <edge from-layer="4272" from-port="0" to-layer="4273" to-port="1" /> <edge from-layer="4273" from-port="2" to-layer="4275" to-port="0" /> <edge from-layer="4274" from-port="0" to-layer="4275" to-port="1" /> <edge from-layer="4275" from-port="2" to-layer="4276" to-port="1" /> <edge from-layer="4276" from-port="2" to-layer="4941" to-port="0" /> <edge from-layer="4276" from-port="2" to-layer="4277" to-port="2" /> <edge from-layer="4277" from-port="4" to-layer="4279" to-port="0" /> <edge from-layer="4278" from-port="0" to-layer="4279" to-port="1" /> <edge from-layer="4279" from-port="2" to-layer="4281" to-port="0" /> <edge from-layer="4280" from-port="0" to-layer="4281" to-port="1" /> <edge from-layer="4281" from-port="2" to-layer="4292" to-port="0" /> <edge from-layer="4282" from-port="0" to-layer="4283" to-port="0" /> <edge from-layer="4283" from-port="1" to-layer="4286" to-port="0" /> <edge from-layer="4284" from-port="0" to-layer="4285" to-port="0" /> <edge from-layer="4285" from-port="1" to-layer="4286" to-port="1" /> <edge from-layer="4286" from-port="2" to-layer="4288" to-port="0" /> <edge from-layer="4287" from-port="0" to-layer="4288" to-port="1" /> <edge from-layer="4288" from-port="2" to-layer="4290" to-port="0" /> <edge from-layer="4289" from-port="0" to-layer="4290" to-port="1" /> <edge from-layer="4290" from-port="2" to-layer="4291" to-port="0" /> <edge from-layer="4291" from-port="1" to-layer="4292" to-port="1" /> <edge from-layer="4292" from-port="2" to-layer="4294" to-port="0" /> <edge from-layer="4293" from-port="0" to-layer="4294" to-port="1" /> <edge from-layer="4294" from-port="2" to-layer="4295" to-port="1" /> <edge from-layer="4295" from-port="2" to-layer="4337" to-port="0" /> <edge from-layer="4295" from-port="2" to-layer="4297" to-port="0" /> <edge from-layer="4296" from-port="0" to-layer="4297" to-port="1" /> <edge from-layer="4297" from-port="2" to-layer="4299" to-port="0" /> <edge from-layer="4298" from-port="0" to-layer="4299" to-port="1" /> <edge from-layer="4299" from-port="2" to-layer="4301" to-port="0" /> <edge from-layer="4300" from-port="0" to-layer="4301" to-port="1" /> <edge from-layer="4301" from-port="2" to-layer="4312" to-port="0" /> <edge from-layer="4302" from-port="0" to-layer="4303" to-port="0" /> <edge from-layer="4303" from-port="1" to-layer="4306" to-port="0" /> <edge from-layer="4304" from-port="0" to-layer="4305" to-port="0" /> <edge from-layer="4305" from-port="1" to-layer="4306" to-port="1" /> <edge from-layer="4306" from-port="2" to-layer="4308" to-port="0" /> <edge from-layer="4307" from-port="0" to-layer="4308" to-port="1" /> <edge from-layer="4308" from-port="2" to-layer="4310" to-port="0" /> <edge from-layer="4309" from-port="0" to-layer="4310" to-port="1" /> <edge from-layer="4310" from-port="2" to-layer="4311" to-port="0" /> <edge from-layer="4311" from-port="1" to-layer="4312" to-port="1" /> <edge from-layer="4312" from-port="2" to-layer="4314" to-port="0" /> <edge from-layer="4313" from-port="0" to-layer="4314" to-port="1" /> <edge from-layer="4314" from-port="2" to-layer="4316" to-port="0" /> <edge from-layer="4315" from-port="0" to-layer="4316" to-port="1" /> <edge from-layer="4316" from-port="2" to-layer="4318" to-port="0" /> <edge from-layer="4317" from-port="0" to-layer="4318" to-port="1" /> <edge from-layer="4318" from-port="2" to-layer="4319" to-port="0" /> <edge from-layer="4319" from-port="3" to-layer="4321" to-port="0" /> <edge from-layer="4320" from-port="0" to-layer="4321" to-port="1" /> <edge from-layer="4321" from-port="2" to-layer="4323" to-port="0" /> <edge from-layer="4322" from-port="0" to-layer="4323" to-port="1" /> <edge from-layer="4323" from-port="2" to-layer="4334" to-port="0" /> <edge from-layer="4324" from-port="0" to-layer="4325" to-port="0" /> <edge from-layer="4325" from-port="1" to-layer="4328" to-port="0" /> <edge from-layer="4326" from-port="0" to-layer="4327" to-port="0" /> <edge from-layer="4327" from-port="1" to-layer="4328" to-port="1" /> <edge from-layer="4328" from-port="2" to-layer="4330" to-port="0" /> <edge from-layer="4329" from-port="0" to-layer="4330" to-port="1" /> <edge from-layer="4330" from-port="2" to-layer="4332" to-port="0" /> <edge from-layer="4331" from-port="0" to-layer="4332" to-port="1" /> <edge from-layer="4332" from-port="2" to-layer="4333" to-port="0" /> <edge from-layer="4333" from-port="1" to-layer="4334" to-port="1" /> <edge from-layer="4334" from-port="2" to-layer="4336" to-port="0" /> <edge from-layer="4335" from-port="0" to-layer="4336" to-port="1" /> <edge from-layer="4336" from-port="2" to-layer="4337" to-port="1" /> <edge from-layer="4337" from-port="2" to-layer="4371" to-port="0" /> <edge from-layer="4337" from-port="2" to-layer="4339" to-port="0" /> <edge from-layer="4338" from-port="0" to-layer="4339" to-port="1" /> <edge from-layer="4339" from-port="2" to-layer="4341" to-port="0" /> <edge from-layer="4340" from-port="0" to-layer="4341" to-port="1" /> <edge from-layer="4341" from-port="2" to-layer="4343" to-port="0" /> <edge from-layer="4342" from-port="0" to-layer="4343" to-port="1" /> <edge from-layer="4343" from-port="2" to-layer="4354" to-port="0" /> <edge from-layer="4344" from-port="0" to-layer="4345" to-port="0" /> <edge from-layer="4345" from-port="1" to-layer="4348" to-port="0" /> <edge from-layer="4346" from-port="0" to-layer="4347" to-port="0" /> <edge from-layer="4347" from-port="1" to-layer="4348" to-port="1" /> <edge from-layer="4348" from-port="2" to-layer="4350" to-port="0" /> <edge from-layer="4349" from-port="0" to-layer="4350" to-port="1" /> <edge from-layer="4350" from-port="2" to-layer="4352" to-port="0" /> <edge from-layer="4351" from-port="0" to-layer="4352" to-port="1" /> <edge from-layer="4352" from-port="2" to-layer="4353" to-port="0" /> <edge from-layer="4353" from-port="1" to-layer="4354" to-port="1" /> <edge from-layer="4354" from-port="2" to-layer="4356" to-port="0" /> <edge from-layer="4355" from-port="0" to-layer="4356" to-port="1" /> <edge from-layer="4356" from-port="2" to-layer="4357" to-port="0" /> <edge from-layer="4357" from-port="1" to-layer="4368" to-port="0" /> <edge from-layer="4358" from-port="0" to-layer="4359" to-port="0" /> <edge from-layer="4359" from-port="1" to-layer="4362" to-port="0" /> <edge from-layer="4360" from-port="0" to-layer="4361" to-port="0" /> <edge from-layer="4361" from-port="1" to-layer="4362" to-port="1" /> <edge from-layer="4362" from-port="2" to-layer="4364" to-port="0" /> <edge from-layer="4363" from-port="0" to-layer="4364" to-port="1" /> <edge from-layer="4364" from-port="2" to-layer="4366" to-port="0" /> <edge from-layer="4365" from-port="0" to-layer="4366" to-port="1" /> <edge from-layer="4366" from-port="2" to-layer="4367" to-port="0" /> <edge from-layer="4367" from-port="1" to-layer="4368" to-port="1" /> <edge from-layer="4368" from-port="2" to-layer="4370" to-port="0" /> <edge from-layer="4369" from-port="0" to-layer="4370" to-port="1" /> <edge from-layer="4370" from-port="2" to-layer="4371" to-port="1" /> <edge from-layer="4371" from-port="2" to-layer="4373" to-port="0" /> <edge from-layer="4371" from-port="2" to-layer="4465" to-port="0" /> <edge from-layer="4372" from-port="0" to-layer="4373" to-port="1" /> <edge from-layer="4373" from-port="2" to-layer="4375" to-port="0" /> <edge from-layer="4374" from-port="0" to-layer="4375" to-port="1" /> <edge from-layer="4375" from-port="2" to-layer="4377" to-port="0" /> <edge from-layer="4376" from-port="0" to-layer="4377" to-port="1" /> <edge from-layer="4377" from-port="2" to-layer="4414" to-port="0" /> <edge from-layer="4377" from-port="2" to-layer="4388" to-port="0" /> <edge from-layer="4377" from-port="2" to-layer="4439" to-port="0" /> <edge from-layer="4378" from-port="0" to-layer="4379" to-port="0" /> <edge from-layer="4379" from-port="1" to-layer="4382" to-port="0" /> <edge from-layer="4380" from-port="0" to-layer="4381" to-port="0" /> <edge from-layer="4381" from-port="1" to-layer="4382" to-port="1" /> <edge from-layer="4382" from-port="2" to-layer="4384" to-port="0" /> <edge from-layer="4383" from-port="0" to-layer="4384" to-port="1" /> <edge from-layer="4384" from-port="2" to-layer="4386" to-port="0" /> <edge from-layer="4385" from-port="0" to-layer="4386" to-port="1" /> <edge from-layer="4386" from-port="2" to-layer="4387" to-port="0" /> <edge from-layer="4387" from-port="1" to-layer="4388" to-port="1" /> <edge from-layer="4388" from-port="2" to-layer="4390" to-port="0" /> <edge from-layer="4389" from-port="0" to-layer="4390" to-port="1" /> <edge from-layer="4390" from-port="2" to-layer="4392" to-port="0" /> <edge from-layer="4391" from-port="0" to-layer="4392" to-port="1" /> <edge from-layer="4392" from-port="2" to-layer="4394" to-port="0" /> <edge from-layer="4393" from-port="0" to-layer="4394" to-port="1" /> <edge from-layer="4394" from-port="2" to-layer="4447" to-port="0" /> <edge from-layer="4395" from-port="0" to-layer="4400" to-port="0" /> <edge from-layer="4396" from-port="0" to-layer="4399" to-port="1" /> <edge from-layer="4397" from-port="0" to-layer="4399" to-port="2" /> <edge from-layer="4398" from-port="0" to-layer="4399" to-port="3" /> <edge from-layer="4399" from-port="4" to-layer="4400" to-port="1" /> <edge from-layer="4400" from-port="2" to-layer="4401" to-port="0" /> <edge from-layer="4401" from-port="1" to-layer="4403" to-port="0" /> <edge from-layer="4402" from-port="0" to-layer="4403" to-port="2" /> <edge from-layer="4403" from-port="3" to-layer="4419" to-port="0" /> <edge from-layer="4404" from-port="0" to-layer="4405" to-port="0" /> <edge from-layer="4405" from-port="1" to-layer="4408" to-port="0" /> <edge from-layer="4406" from-port="0" to-layer="4407" to-port="0" /> <edge from-layer="4407" from-port="1" to-layer="4408" to-port="1" /> <edge from-layer="4408" from-port="2" to-layer="4410" to-port="0" /> <edge from-layer="4409" from-port="0" to-layer="4410" to-port="1" /> <edge from-layer="4410" from-port="2" to-layer="4412" to-port="0" /> <edge from-layer="4411" from-port="0" to-layer="4412" to-port="1" /> <edge from-layer="4412" from-port="2" to-layer="4413" to-port="0" /> <edge from-layer="4413" from-port="1" to-layer="4414" to-port="1" /> <edge from-layer="4414" from-port="2" to-layer="4416" to-port="0" /> <edge from-layer="4415" from-port="0" to-layer="4416" to-port="1" /> <edge from-layer="4416" from-port="2" to-layer="4418" to-port="0" /> <edge from-layer="4417" from-port="0" to-layer="4418" to-port="1" /> <edge from-layer="4418" from-port="2" to-layer="4419" to-port="1" /> <edge from-layer="4419" from-port="2" to-layer="4447" to-port="1" /> <edge from-layer="4419" from-port="2" to-layer="4938" to-port="0" /> <edge from-layer="4420" from-port="0" to-layer="4425" to-port="0" /> <edge from-layer="4421" from-port="0" to-layer="4424" to-port="1" /> <edge from-layer="4422" from-port="0" to-layer="4424" to-port="2" /> <edge from-layer="4423" from-port="0" to-layer="4424" to-port="3" /> <edge from-layer="4424" from-port="4" to-layer="4425" to-port="1" /> <edge from-layer="4425" from-port="2" to-layer="4426" to-port="0" /> <edge from-layer="4426" from-port="1" to-layer="4428" to-port="0" /> <edge from-layer="4427" from-port="0" to-layer="4428" to-port="2" /> <edge from-layer="4428" from-port="3" to-layer="4446" to-port="0" /> <edge from-layer="4429" from-port="0" to-layer="4430" to-port="0" /> <edge from-layer="4430" from-port="1" to-layer="4433" to-port="0" /> <edge from-layer="4431" from-port="0" to-layer="4432" to-port="0" /> <edge from-layer="4432" from-port="1" to-layer="4433" to-port="1" /> <edge from-layer="4433" from-port="2" to-layer="4435" to-port="0" /> <edge from-layer="4434" from-port="0" to-layer="4435" to-port="1" /> <edge from-layer="4435" from-port="2" to-layer="4437" to-port="0" /> <edge from-layer="4436" from-port="0" to-layer="4437" to-port="1" /> <edge from-layer="4437" from-port="2" to-layer="4438" to-port="0" /> <edge from-layer="4438" from-port="1" to-layer="4439" to-port="1" /> <edge from-layer="4439" from-port="2" to-layer="4441" to-port="0" /> <edge from-layer="4440" from-port="0" to-layer="4441" to-port="1" /> <edge from-layer="4441" from-port="2" to-layer="4443" to-port="0" /> <edge from-layer="4442" from-port="0" to-layer="4443" to-port="1" /> <edge from-layer="4443" from-port="2" to-layer="4445" to-port="0" /> <edge from-layer="4444" from-port="0" to-layer="4445" to-port="1" /> <edge from-layer="4445" from-port="2" to-layer="4446" to-port="1" /> <edge from-layer="4446" from-port="2" to-layer="4447" to-port="2" /> <edge from-layer="4446" from-port="2" to-layer="4937" to-port="0" /> <edge from-layer="4447" from-port="4" to-layer="4449" to-port="0" /> <edge from-layer="4448" from-port="0" to-layer="4449" to-port="1" /> <edge from-layer="4449" from-port="2" to-layer="4451" to-port="0" /> <edge from-layer="4450" from-port="0" to-layer="4451" to-port="1" /> <edge from-layer="4451" from-port="2" to-layer="4462" to-port="0" /> <edge from-layer="4452" from-port="0" to-layer="4453" to-port="0" /> <edge from-layer="4453" from-port="1" to-layer="4456" to-port="0" /> <edge from-layer="4454" from-port="0" to-layer="4455" to-port="0" /> <edge from-layer="4455" from-port="1" to-layer="4456" to-port="1" /> <edge from-layer="4456" from-port="2" to-layer="4458" to-port="0" /> <edge from-layer="4457" from-port="0" to-layer="4458" to-port="1" /> <edge from-layer="4458" from-port="2" to-layer="4460" to-port="0" /> <edge from-layer="4459" from-port="0" to-layer="4460" to-port="1" /> <edge from-layer="4460" from-port="2" to-layer="4461" to-port="0" /> <edge from-layer="4461" from-port="1" to-layer="4462" to-port="1" /> <edge from-layer="4462" from-port="2" to-layer="4464" to-port="0" /> <edge from-layer="4463" from-port="0" to-layer="4464" to-port="1" /> <edge from-layer="4464" from-port="2" to-layer="4465" to-port="1" /> <edge from-layer="4465" from-port="2" to-layer="4507" to-port="0" /> <edge from-layer="4465" from-port="2" to-layer="4467" to-port="0" /> <edge from-layer="4466" from-port="0" to-layer="4467" to-port="1" /> <edge from-layer="4467" from-port="2" to-layer="4469" to-port="0" /> <edge from-layer="4468" from-port="0" to-layer="4469" to-port="1" /> <edge from-layer="4469" from-port="2" to-layer="4471" to-port="0" /> <edge from-layer="4470" from-port="0" to-layer="4471" to-port="1" /> <edge from-layer="4471" from-port="2" to-layer="4482" to-port="0" /> <edge from-layer="4472" from-port="0" to-layer="4473" to-port="0" /> <edge from-layer="4473" from-port="1" to-layer="4476" to-port="0" /> <edge from-layer="4474" from-port="0" to-layer="4475" to-port="0" /> <edge from-layer="4475" from-port="1" to-layer="4476" to-port="1" /> <edge from-layer="4476" from-port="2" to-layer="4478" to-port="0" /> <edge from-layer="4477" from-port="0" to-layer="4478" to-port="1" /> <edge from-layer="4478" from-port="2" to-layer="4480" to-port="0" /> <edge from-layer="4479" from-port="0" to-layer="4480" to-port="1" /> <edge from-layer="4480" from-port="2" to-layer="4481" to-port="0" /> <edge from-layer="4481" from-port="1" to-layer="4482" to-port="1" /> <edge from-layer="4482" from-port="2" to-layer="4484" to-port="0" /> <edge from-layer="4483" from-port="0" to-layer="4484" to-port="1" /> <edge from-layer="4484" from-port="2" to-layer="4486" to-port="0" /> <edge from-layer="4485" from-port="0" to-layer="4486" to-port="1" /> <edge from-layer="4486" from-port="2" to-layer="4488" to-port="0" /> <edge from-layer="4487" from-port="0" to-layer="4488" to-port="1" /> <edge from-layer="4488" from-port="2" to-layer="4489" to-port="0" /> <edge from-layer="4489" from-port="3" to-layer="4491" to-port="0" /> <edge from-layer="4490" from-port="0" to-layer="4491" to-port="1" /> <edge from-layer="4491" from-port="2" to-layer="4493" to-port="0" /> <edge from-layer="4492" from-port="0" to-layer="4493" to-port="1" /> <edge from-layer="4493" from-port="2" to-layer="4504" to-port="0" /> <edge from-layer="4494" from-port="0" to-layer="4495" to-port="0" /> <edge from-layer="4495" from-port="1" to-layer="4498" to-port="0" /> <edge from-layer="4496" from-port="0" to-layer="4497" to-port="0" /> <edge from-layer="4497" from-port="1" to-layer="4498" to-port="1" /> <edge from-layer="4498" from-port="2" to-layer="4500" to-port="0" /> <edge from-layer="4499" from-port="0" to-layer="4500" to-port="1" /> <edge from-layer="4500" from-port="2" to-layer="4502" to-port="0" /> <edge from-layer="4501" from-port="0" to-layer="4502" to-port="1" /> <edge from-layer="4502" from-port="2" to-layer="4503" to-port="0" /> <edge from-layer="4503" from-port="1" to-layer="4504" to-port="1" /> <edge from-layer="4504" from-port="2" to-layer="4506" to-port="0" /> <edge from-layer="4505" from-port="0" to-layer="4506" to-port="1" /> <edge from-layer="4506" from-port="2" to-layer="4507" to-port="1" /> <edge from-layer="4507" from-port="2" to-layer="4541" to-port="0" /> <edge from-layer="4507" from-port="2" to-layer="4509" to-port="0" /> <edge from-layer="4508" from-port="0" to-layer="4509" to-port="1" /> <edge from-layer="4509" from-port="2" to-layer="4511" to-port="0" /> <edge from-layer="4510" from-port="0" to-layer="4511" to-port="1" /> <edge from-layer="4511" from-port="2" to-layer="4513" to-port="0" /> <edge from-layer="4512" from-port="0" to-layer="4513" to-port="1" /> <edge from-layer="4513" from-port="2" to-layer="4524" to-port="0" /> <edge from-layer="4514" from-port="0" to-layer="4515" to-port="0" /> <edge from-layer="4515" from-port="1" to-layer="4518" to-port="0" /> <edge from-layer="4516" from-port="0" to-layer="4517" to-port="0" /> <edge from-layer="4517" from-port="1" to-layer="4518" to-port="1" /> <edge from-layer="4518" from-port="2" to-layer="4520" to-port="0" /> <edge from-layer="4519" from-port="0" to-layer="4520" to-port="1" /> <edge from-layer="4520" from-port="2" to-layer="4522" to-port="0" /> <edge from-layer="4521" from-port="0" to-layer="4522" to-port="1" /> <edge from-layer="4522" from-port="2" to-layer="4523" to-port="0" /> <edge from-layer="4523" from-port="1" to-layer="4524" to-port="1" /> <edge from-layer="4524" from-port="2" to-layer="4526" to-port="0" /> <edge from-layer="4525" from-port="0" to-layer="4526" to-port="1" /> <edge from-layer="4526" from-port="2" to-layer="4527" to-port="0" /> <edge from-layer="4527" from-port="1" to-layer="4538" to-port="0" /> <edge from-layer="4528" from-port="0" to-layer="4529" to-port="0" /> <edge from-layer="4529" from-port="1" to-layer="4532" to-port="0" /> <edge from-layer="4530" from-port="0" to-layer="4531" to-port="0" /> <edge from-layer="4531" from-port="1" to-layer="4532" to-port="1" /> <edge from-layer="4532" from-port="2" to-layer="4534" to-port="0" /> <edge from-layer="4533" from-port="0" to-layer="4534" to-port="1" /> <edge from-layer="4534" from-port="2" to-layer="4536" to-port="0" /> <edge from-layer="4535" from-port="0" to-layer="4536" to-port="1" /> <edge from-layer="4536" from-port="2" to-layer="4537" to-port="0" /> <edge from-layer="4537" from-port="1" to-layer="4538" to-port="1" /> <edge from-layer="4538" from-port="2" to-layer="4540" to-port="0" /> <edge from-layer="4539" from-port="0" to-layer="4540" to-port="1" /> <edge from-layer="4540" from-port="2" to-layer="4541" to-port="1" /> <edge from-layer="4541" from-port="2" to-layer="4635" to-port="0" /> <edge from-layer="4541" from-port="2" to-layer="4543" to-port="0" /> <edge from-layer="4542" from-port="0" to-layer="4543" to-port="1" /> <edge from-layer="4543" from-port="2" to-layer="4545" to-port="0" /> <edge from-layer="4544" from-port="0" to-layer="4545" to-port="1" /> <edge from-layer="4545" from-port="2" to-layer="4547" to-port="0" /> <edge from-layer="4546" from-port="0" to-layer="4547" to-port="1" /> <edge from-layer="4547" from-port="2" to-layer="4558" to-port="0" /> <edge from-layer="4547" from-port="2" to-layer="4609" to-port="0" /> <edge from-layer="4547" from-port="2" to-layer="4584" to-port="0" /> <edge from-layer="4548" from-port="0" to-layer="4549" to-port="0" /> <edge from-layer="4549" from-port="1" to-layer="4552" to-port="0" /> <edge from-layer="4550" from-port="0" to-layer="4551" to-port="0" /> <edge from-layer="4551" from-port="1" to-layer="4552" to-port="1" /> <edge from-layer="4552" from-port="2" to-layer="4554" to-port="0" /> <edge from-layer="4553" from-port="0" to-layer="4554" to-port="1" /> <edge from-layer="4554" from-port="2" to-layer="4556" to-port="0" /> <edge from-layer="4555" from-port="0" to-layer="4556" to-port="1" /> <edge from-layer="4556" from-port="2" to-layer="4557" to-port="0" /> <edge from-layer="4557" from-port="1" to-layer="4558" to-port="1" /> <edge from-layer="4558" from-port="2" to-layer="4560" to-port="0" /> <edge from-layer="4559" from-port="0" to-layer="4560" to-port="1" /> <edge from-layer="4560" from-port="2" to-layer="4562" to-port="0" /> <edge from-layer="4561" from-port="0" to-layer="4562" to-port="1" /> <edge from-layer="4562" from-port="2" to-layer="4564" to-port="0" /> <edge from-layer="4563" from-port="0" to-layer="4564" to-port="1" /> <edge from-layer="4564" from-port="2" to-layer="4617" to-port="0" /> <edge from-layer="4565" from-port="0" to-layer="4570" to-port="0" /> <edge from-layer="4566" from-port="0" to-layer="4569" to-port="1" /> <edge from-layer="4567" from-port="0" to-layer="4569" to-port="2" /> <edge from-layer="4568" from-port="0" to-layer="4569" to-port="3" /> <edge from-layer="4569" from-port="4" to-layer="4570" to-port="1" /> <edge from-layer="4570" from-port="2" to-layer="4571" to-port="0" /> <edge from-layer="4571" from-port="1" to-layer="4573" to-port="0" /> <edge from-layer="4572" from-port="0" to-layer="4573" to-port="2" /> <edge from-layer="4573" from-port="3" to-layer="4589" to-port="0" /> <edge from-layer="4574" from-port="0" to-layer="4575" to-port="0" /> <edge from-layer="4575" from-port="1" to-layer="4578" to-port="0" /> <edge from-layer="4576" from-port="0" to-layer="4577" to-port="0" /> <edge from-layer="4577" from-port="1" to-layer="4578" to-port="1" /> <edge from-layer="4578" from-port="2" to-layer="4580" to-port="0" /> <edge from-layer="4579" from-port="0" to-layer="4580" to-port="1" /> <edge from-layer="4580" from-port="2" to-layer="4582" to-port="0" /> <edge from-layer="4581" from-port="0" to-layer="4582" to-port="1" /> <edge from-layer="4582" from-port="2" to-layer="4583" to-port="0" /> <edge from-layer="4583" from-port="1" to-layer="4584" to-port="1" /> <edge from-layer="4584" from-port="2" to-layer="4586" to-port="0" /> <edge from-layer="4585" from-port="0" to-layer="4586" to-port="1" /> <edge from-layer="4586" from-port="2" to-layer="4588" to-port="0" /> <edge from-layer="4587" from-port="0" to-layer="4588" to-port="1" /> <edge from-layer="4588" from-port="2" to-layer="4589" to-port="1" /> <edge from-layer="4589" from-port="2" to-layer="4936" to-port="0" /> <edge from-layer="4589" from-port="2" to-layer="4617" to-port="1" /> <edge from-layer="4590" from-port="0" to-layer="4595" to-port="0" /> <edge from-layer="4591" from-port="0" to-layer="4594" to-port="1" /> <edge from-layer="4592" from-port="0" to-layer="4594" to-port="2" /> <edge from-layer="4593" from-port="0" to-layer="4594" to-port="3" /> <edge from-layer="4594" from-port="4" to-layer="4595" to-port="1" /> <edge from-layer="4595" from-port="2" to-layer="4596" to-port="0" /> <edge from-layer="4596" from-port="1" to-layer="4598" to-port="0" /> <edge from-layer="4597" from-port="0" to-layer="4598" to-port="2" /> <edge from-layer="4598" from-port="3" to-layer="4616" to-port="0" /> <edge from-layer="4599" from-port="0" to-layer="4600" to-port="0" /> <edge from-layer="4600" from-port="1" to-layer="4603" to-port="0" /> <edge from-layer="4601" from-port="0" to-layer="4602" to-port="0" /> <edge from-layer="4602" from-port="1" to-layer="4603" to-port="1" /> <edge from-layer="4603" from-port="2" to-layer="4605" to-port="0" /> <edge from-layer="4604" from-port="0" to-layer="4605" to-port="1" /> <edge from-layer="4605" from-port="2" to-layer="4607" to-port="0" /> <edge from-layer="4606" from-port="0" to-layer="4607" to-port="1" /> <edge from-layer="4607" from-port="2" to-layer="4608" to-port="0" /> <edge from-layer="4608" from-port="1" to-layer="4609" to-port="1" /> <edge from-layer="4609" from-port="2" to-layer="4611" to-port="0" /> <edge from-layer="4610" from-port="0" to-layer="4611" to-port="1" /> <edge from-layer="4611" from-port="2" to-layer="4613" to-port="0" /> <edge from-layer="4612" from-port="0" to-layer="4613" to-port="1" /> <edge from-layer="4613" from-port="2" to-layer="4615" to-port="0" /> <edge from-layer="4614" from-port="0" to-layer="4615" to-port="1" /> <edge from-layer="4615" from-port="2" to-layer="4616" to-port="1" /> <edge from-layer="4616" from-port="2" to-layer="4935" to-port="0" /> <edge from-layer="4616" from-port="2" to-layer="4617" to-port="2" /> <edge from-layer="4617" from-port="4" to-layer="4619" to-port="0" /> <edge from-layer="4618" from-port="0" to-layer="4619" to-port="1" /> <edge from-layer="4619" from-port="2" to-layer="4621" to-port="0" /> <edge from-layer="4620" from-port="0" to-layer="4621" to-port="1" /> <edge from-layer="4621" from-port="2" to-layer="4632" to-port="0" /> <edge from-layer="4622" from-port="0" to-layer="4623" to-port="0" /> <edge from-layer="4623" from-port="1" to-layer="4626" to-port="0" /> <edge from-layer="4624" from-port="0" to-layer="4625" to-port="0" /> <edge from-layer="4625" from-port="1" to-layer="4626" to-port="1" /> <edge from-layer="4626" from-port="2" to-layer="4628" to-port="0" /> <edge from-layer="4627" from-port="0" to-layer="4628" to-port="1" /> <edge from-layer="4628" from-port="2" to-layer="4630" to-port="0" /> <edge from-layer="4629" from-port="0" to-layer="4630" to-port="1" /> <edge from-layer="4630" from-port="2" to-layer="4631" to-port="0" /> <edge from-layer="4631" from-port="1" to-layer="4632" to-port="1" /> <edge from-layer="4632" from-port="2" to-layer="4634" to-port="0" /> <edge from-layer="4633" from-port="0" to-layer="4634" to-port="1" /> <edge from-layer="4634" from-port="2" to-layer="4635" to-port="1" /> <edge from-layer="4635" from-port="2" to-layer="4637" to-port="0" /> <edge from-layer="4635" from-port="2" to-layer="4677" to-port="0" /> <edge from-layer="4636" from-port="0" to-layer="4637" to-port="1" /> <edge from-layer="4637" from-port="2" to-layer="4639" to-port="0" /> <edge from-layer="4638" from-port="0" to-layer="4639" to-port="1" /> <edge from-layer="4639" from-port="2" to-layer="4641" to-port="0" /> <edge from-layer="4640" from-port="0" to-layer="4641" to-port="1" /> <edge from-layer="4641" from-port="2" to-layer="4652" to-port="0" /> <edge from-layer="4642" from-port="0" to-layer="4643" to-port="0" /> <edge from-layer="4643" from-port="1" to-layer="4646" to-port="0" /> <edge from-layer="4644" from-port="0" to-layer="4645" to-port="0" /> <edge from-layer="4645" from-port="1" to-layer="4646" to-port="1" /> <edge from-layer="4646" from-port="2" to-layer="4648" to-port="0" /> <edge from-layer="4647" from-port="0" to-layer="4648" to-port="1" /> <edge from-layer="4648" from-port="2" to-layer="4650" to-port="0" /> <edge from-layer="4649" from-port="0" to-layer="4650" to-port="1" /> <edge from-layer="4650" from-port="2" to-layer="4651" to-port="0" /> <edge from-layer="4651" from-port="1" to-layer="4652" to-port="1" /> <edge from-layer="4652" from-port="2" to-layer="4654" to-port="0" /> <edge from-layer="4653" from-port="0" to-layer="4654" to-port="1" /> <edge from-layer="4654" from-port="2" to-layer="4656" to-port="0" /> <edge from-layer="4655" from-port="0" to-layer="4656" to-port="1" /> <edge from-layer="4656" from-port="2" to-layer="4658" to-port="0" /> <edge from-layer="4657" from-port="0" to-layer="4658" to-port="1" /> <edge from-layer="4658" from-port="2" to-layer="4659" to-port="0" /> <edge from-layer="4659" from-port="3" to-layer="4661" to-port="0" /> <edge from-layer="4660" from-port="0" to-layer="4661" to-port="1" /> <edge from-layer="4661" from-port="2" to-layer="4663" to-port="0" /> <edge from-layer="4662" from-port="0" to-layer="4663" to-port="1" /> <edge from-layer="4663" from-port="2" to-layer="4674" to-port="0" /> <edge from-layer="4664" from-port="0" to-layer="4665" to-port="0" /> <edge from-layer="4665" from-port="1" to-layer="4668" to-port="0" /> <edge from-layer="4666" from-port="0" to-layer="4667" to-port="0" /> <edge from-layer="4667" from-port="1" to-layer="4668" to-port="1" /> <edge from-layer="4668" from-port="2" to-layer="4670" to-port="0" /> <edge from-layer="4669" from-port="0" to-layer="4670" to-port="1" /> <edge from-layer="4670" from-port="2" to-layer="4672" to-port="0" /> <edge from-layer="4671" from-port="0" to-layer="4672" to-port="1" /> <edge from-layer="4672" from-port="2" to-layer="4673" to-port="0" /> <edge from-layer="4673" from-port="1" to-layer="4674" to-port="1" /> <edge from-layer="4674" from-port="2" to-layer="4676" to-port="0" /> <edge from-layer="4675" from-port="0" to-layer="4676" to-port="1" /> <edge from-layer="4676" from-port="2" to-layer="4677" to-port="1" /> <edge from-layer="4677" from-port="2" to-layer="4679" to-port="0" /> <edge from-layer="4677" from-port="2" to-layer="4711" to-port="0" /> <edge from-layer="4678" from-port="0" to-layer="4679" to-port="1" /> <edge from-layer="4679" from-port="2" to-layer="4681" to-port="0" /> <edge from-layer="4680" from-port="0" to-layer="4681" to-port="1" /> <edge from-layer="4681" from-port="2" to-layer="4683" to-port="0" /> <edge from-layer="4682" from-port="0" to-layer="4683" to-port="1" /> <edge from-layer="4683" from-port="2" to-layer="4694" to-port="0" /> <edge from-layer="4684" from-port="0" to-layer="4685" to-port="0" /> <edge from-layer="4685" from-port="1" to-layer="4688" to-port="0" /> <edge from-layer="4686" from-port="0" to-layer="4687" to-port="0" /> <edge from-layer="4687" from-port="1" to-layer="4688" to-port="1" /> <edge from-layer="4688" from-port="2" to-layer="4690" to-port="0" /> <edge from-layer="4689" from-port="0" to-layer="4690" to-port="1" /> <edge from-layer="4690" from-port="2" to-layer="4692" to-port="0" /> <edge from-layer="4691" from-port="0" to-layer="4692" to-port="1" /> <edge from-layer="4692" from-port="2" to-layer="4693" to-port="0" /> <edge from-layer="4693" from-port="1" to-layer="4694" to-port="1" /> <edge from-layer="4694" from-port="2" to-layer="4696" to-port="0" /> <edge from-layer="4695" from-port="0" to-layer="4696" to-port="1" /> <edge from-layer="4696" from-port="2" to-layer="4697" to-port="0" /> <edge from-layer="4697" from-port="1" to-layer="4708" to-port="0" /> <edge from-layer="4698" from-port="0" to-layer="4699" to-port="0" /> <edge from-layer="4699" from-port="1" to-layer="4702" to-port="0" /> <edge from-layer="4700" from-port="0" to-layer="4701" to-port="0" /> <edge from-layer="4701" from-port="1" to-layer="4702" to-port="1" /> <edge from-layer="4702" from-port="2" to-layer="4704" to-port="0" /> <edge from-layer="4703" from-port="0" to-layer="4704" to-port="1" /> <edge from-layer="4704" from-port="2" to-layer="4706" to-port="0" /> <edge from-layer="4705" from-port="0" to-layer="4706" to-port="1" /> <edge from-layer="4706" from-port="2" to-layer="4707" to-port="0" /> <edge from-layer="4707" from-port="1" to-layer="4708" to-port="1" /> <edge from-layer="4708" from-port="2" to-layer="4710" to-port="0" /> <edge from-layer="4709" from-port="0" to-layer="4710" to-port="1" /> <edge from-layer="4710" from-port="2" to-layer="4711" to-port="1" /> <edge from-layer="4711" from-port="2" to-layer="4713" to-port="0" /> <edge from-layer="4711" from-port="2" to-layer="4805" to-port="0" /> <edge from-layer="4712" from-port="0" to-layer="4713" to-port="1" /> <edge from-layer="4713" from-port="2" to-layer="4715" to-port="0" /> <edge from-layer="4714" from-port="0" to-layer="4715" to-port="1" /> <edge from-layer="4715" from-port="2" to-layer="4717" to-port="0" /> <edge from-layer="4716" from-port="0" to-layer="4717" to-port="1" /> <edge from-layer="4717" from-port="2" to-layer="4779" to-port="0" /> <edge from-layer="4717" from-port="2" to-layer="4728" to-port="0" /> <edge from-layer="4717" from-port="2" to-layer="4754" to-port="0" /> <edge from-layer="4718" from-port="0" to-layer="4719" to-port="0" /> <edge from-layer="4719" from-port="1" to-layer="4722" to-port="0" /> <edge from-layer="4720" from-port="0" to-layer="4721" to-port="0" /> <edge from-layer="4721" from-port="1" to-layer="4722" to-port="1" /> <edge from-layer="4722" from-port="2" to-layer="4724" to-port="0" /> <edge from-layer="4723" from-port="0" to-layer="4724" to-port="1" /> <edge from-layer="4724" from-port="2" to-layer="4726" to-port="0" /> <edge from-layer="4725" from-port="0" to-layer="4726" to-port="1" /> <edge from-layer="4726" from-port="2" to-layer="4727" to-port="0" /> <edge from-layer="4727" from-port="1" to-layer="4728" to-port="1" /> <edge from-layer="4728" from-port="2" to-layer="4730" to-port="0" /> <edge from-layer="4729" from-port="0" to-layer="4730" to-port="1" /> <edge from-layer="4730" from-port="2" to-layer="4732" to-port="0" /> <edge from-layer="4731" from-port="0" to-layer="4732" to-port="1" /> <edge from-layer="4732" from-port="2" to-layer="4734" to-port="0" /> <edge from-layer="4733" from-port="0" to-layer="4734" to-port="1" /> <edge from-layer="4734" from-port="2" to-layer="4787" to-port="0" /> <edge from-layer="4735" from-port="0" to-layer="4740" to-port="0" /> <edge from-layer="4736" from-port="0" to-layer="4739" to-port="1" /> <edge from-layer="4737" from-port="0" to-layer="4739" to-port="2" /> <edge from-layer="4738" from-port="0" to-layer="4739" to-port="3" /> <edge from-layer="4739" from-port="4" to-layer="4740" to-port="1" /> <edge from-layer="4740" from-port="2" to-layer="4741" to-port="0" /> <edge from-layer="4741" from-port="1" to-layer="4743" to-port="0" /> <edge from-layer="4742" from-port="0" to-layer="4743" to-port="2" /> <edge from-layer="4743" from-port="3" to-layer="4759" to-port="0" /> <edge from-layer="4744" from-port="0" to-layer="4745" to-port="0" /> <edge from-layer="4745" from-port="1" to-layer="4748" to-port="0" /> <edge from-layer="4746" from-port="0" to-layer="4747" to-port="0" /> <edge from-layer="4747" from-port="1" to-layer="4748" to-port="1" /> <edge from-layer="4748" from-port="2" to-layer="4750" to-port="0" /> <edge from-layer="4749" from-port="0" to-layer="4750" to-port="1" /> <edge from-layer="4750" from-port="2" to-layer="4752" to-port="0" /> <edge from-layer="4751" from-port="0" to-layer="4752" to-port="1" /> <edge from-layer="4752" from-port="2" to-layer="4753" to-port="0" /> <edge from-layer="4753" from-port="1" to-layer="4754" to-port="1" /> <edge from-layer="4754" from-port="2" to-layer="4756" to-port="0" /> <edge from-layer="4755" from-port="0" to-layer="4756" to-port="1" /> <edge from-layer="4756" from-port="2" to-layer="4758" to-port="0" /> <edge from-layer="4757" from-port="0" to-layer="4758" to-port="1" /> <edge from-layer="4758" from-port="2" to-layer="4759" to-port="1" /> <edge from-layer="4759" from-port="2" to-layer="4787" to-port="1" /> <edge from-layer="4759" from-port="2" to-layer="4934" to-port="0" /> <edge from-layer="4760" from-port="0" to-layer="4765" to-port="0" /> <edge from-layer="4761" from-port="0" to-layer="4764" to-port="1" /> <edge from-layer="4762" from-port="0" to-layer="4764" to-port="2" /> <edge from-layer="4763" from-port="0" to-layer="4764" to-port="3" /> <edge from-layer="4764" from-port="4" to-layer="4765" to-port="1" /> <edge from-layer="4765" from-port="2" to-layer="4766" to-port="0" /> <edge from-layer="4766" from-port="1" to-layer="4768" to-port="0" /> <edge from-layer="4767" from-port="0" to-layer="4768" to-port="2" /> <edge from-layer="4768" from-port="3" to-layer="4786" to-port="0" /> <edge from-layer="4769" from-port="0" to-layer="4770" to-port="0" /> <edge from-layer="4770" from-port="1" to-layer="4773" to-port="0" /> <edge from-layer="4771" from-port="0" to-layer="4772" to-port="0" /> <edge from-layer="4772" from-port="1" to-layer="4773" to-port="1" /> <edge from-layer="4773" from-port="2" to-layer="4775" to-port="0" /> <edge from-layer="4774" from-port="0" to-layer="4775" to-port="1" /> <edge from-layer="4775" from-port="2" to-layer="4777" to-port="0" /> <edge from-layer="4776" from-port="0" to-layer="4777" to-port="1" /> <edge from-layer="4777" from-port="2" to-layer="4778" to-port="0" /> <edge from-layer="4778" from-port="1" to-layer="4779" to-port="1" /> <edge from-layer="4779" from-port="2" to-layer="4781" to-port="0" /> <edge from-layer="4780" from-port="0" to-layer="4781" to-port="1" /> <edge from-layer="4781" from-port="2" to-layer="4783" to-port="0" /> <edge from-layer="4782" from-port="0" to-layer="4783" to-port="1" /> <edge from-layer="4783" from-port="2" to-layer="4785" to-port="0" /> <edge from-layer="4784" from-port="0" to-layer="4785" to-port="1" /> <edge from-layer="4785" from-port="2" to-layer="4786" to-port="1" /> <edge from-layer="4786" from-port="2" to-layer="4933" to-port="0" /> <edge from-layer="4786" from-port="2" to-layer="4787" to-port="2" /> <edge from-layer="4787" from-port="4" to-layer="4789" to-port="0" /> <edge from-layer="4788" from-port="0" to-layer="4789" to-port="1" /> <edge from-layer="4789" from-port="2" to-layer="4791" to-port="0" /> <edge from-layer="4790" from-port="0" to-layer="4791" to-port="1" /> <edge from-layer="4791" from-port="2" to-layer="4802" to-port="0" /> <edge from-layer="4792" from-port="0" to-layer="4793" to-port="0" /> <edge from-layer="4793" from-port="1" to-layer="4796" to-port="0" /> <edge from-layer="4794" from-port="0" to-layer="4795" to-port="0" /> <edge from-layer="4795" from-port="1" to-layer="4796" to-port="1" /> <edge from-layer="4796" from-port="2" to-layer="4798" to-port="0" /> <edge from-layer="4797" from-port="0" to-layer="4798" to-port="1" /> <edge from-layer="4798" from-port="2" to-layer="4800" to-port="0" /> <edge from-layer="4799" from-port="0" to-layer="4800" to-port="1" /> <edge from-layer="4800" from-port="2" to-layer="4801" to-port="0" /> <edge from-layer="4801" from-port="1" to-layer="4802" to-port="1" /> <edge from-layer="4802" from-port="2" to-layer="4804" to-port="0" /> <edge from-layer="4803" from-port="0" to-layer="4804" to-port="1" /> <edge from-layer="4804" from-port="2" to-layer="4805" to-port="1" /> <edge from-layer="4805" from-port="2" to-layer="4807" to-port="0" /> <edge from-layer="4805" from-port="2" to-layer="4847" to-port="0" /> <edge from-layer="4806" from-port="0" to-layer="4807" to-port="1" /> <edge from-layer="4807" from-port="2" to-layer="4809" to-port="0" /> <edge from-layer="4808" from-port="0" to-layer="4809" to-port="1" /> <edge from-layer="4809" from-port="2" to-layer="4811" to-port="0" /> <edge from-layer="4810" from-port="0" to-layer="4811" to-port="1" /> <edge from-layer="4811" from-port="2" to-layer="4822" to-port="0" /> <edge from-layer="4812" from-port="0" to-layer="4813" to-port="0" /> <edge from-layer="4813" from-port="1" to-layer="4816" to-port="0" /> <edge from-layer="4814" from-port="0" to-layer="4815" to-port="0" /> <edge from-layer="4815" from-port="1" to-layer="4816" to-port="1" /> <edge from-layer="4816" from-port="2" to-layer="4818" to-port="0" /> <edge from-layer="4817" from-port="0" to-layer="4818" to-port="1" /> <edge from-layer="4818" from-port="2" to-layer="4820" to-port="0" /> <edge from-layer="4819" from-port="0" to-layer="4820" to-port="1" /> <edge from-layer="4820" from-port="2" to-layer="4821" to-port="0" /> <edge from-layer="4821" from-port="1" to-layer="4822" to-port="1" /> <edge from-layer="4822" from-port="2" to-layer="4824" to-port="0" /> <edge from-layer="4823" from-port="0" to-layer="4824" to-port="1" /> <edge from-layer="4824" from-port="2" to-layer="4826" to-port="0" /> <edge from-layer="4825" from-port="0" to-layer="4826" to-port="1" /> <edge from-layer="4826" from-port="2" to-layer="4828" to-port="0" /> <edge from-layer="4827" from-port="0" to-layer="4828" to-port="1" /> <edge from-layer="4828" from-port="2" to-layer="4829" to-port="0" /> <edge from-layer="4829" from-port="3" to-layer="4831" to-port="0" /> <edge from-layer="4830" from-port="0" to-layer="4831" to-port="1" /> <edge from-layer="4831" from-port="2" to-layer="4833" to-port="0" /> <edge from-layer="4832" from-port="0" to-layer="4833" to-port="1" /> <edge from-layer="4833" from-port="2" to-layer="4844" to-port="0" /> <edge from-layer="4834" from-port="0" to-layer="4835" to-port="0" /> <edge from-layer="4835" from-port="1" to-layer="4838" to-port="0" /> <edge from-layer="4836" from-port="0" to-layer="4837" to-port="0" /> <edge from-layer="4837" from-port="1" to-layer="4838" to-port="1" /> <edge from-layer="4838" from-port="2" to-layer="4840" to-port="0" /> <edge from-layer="4839" from-port="0" to-layer="4840" to-port="1" /> <edge from-layer="4840" from-port="2" to-layer="4842" to-port="0" /> <edge from-layer="4841" from-port="0" to-layer="4842" to-port="1" /> <edge from-layer="4842" from-port="2" to-layer="4843" to-port="0" /> <edge from-layer="4843" from-port="1" to-layer="4844" to-port="1" /> <edge from-layer="4844" from-port="2" to-layer="4846" to-port="0" /> <edge from-layer="4845" from-port="0" to-layer="4846" to-port="1" /> <edge from-layer="4846" from-port="2" to-layer="4847" to-port="1" /> <edge from-layer="4847" from-port="2" to-layer="4849" to-port="0" /> <edge from-layer="4847" from-port="2" to-layer="4881" to-port="0" /> <edge from-layer="4848" from-port="0" to-layer="4849" to-port="1" /> <edge from-layer="4849" from-port="2" to-layer="4851" to-port="0" /> <edge from-layer="4850" from-port="0" to-layer="4851" to-port="1" /> <edge from-layer="4851" from-port="2" to-layer="4853" to-port="0" /> <edge from-layer="4852" from-port="0" to-layer="4853" to-port="1" /> <edge from-layer="4853" from-port="2" to-layer="4864" to-port="0" /> <edge from-layer="4854" from-port="0" to-layer="4855" to-port="0" /> <edge from-layer="4855" from-port="1" to-layer="4858" to-port="0" /> <edge from-layer="4856" from-port="0" to-layer="4857" to-port="0" /> <edge from-layer="4857" from-port="1" to-layer="4858" to-port="1" /> <edge from-layer="4858" from-port="2" to-layer="4860" to-port="0" /> <edge from-layer="4859" from-port="0" to-layer="4860" to-port="1" /> <edge from-layer="4860" from-port="2" to-layer="4862" to-port="0" /> <edge from-layer="4861" from-port="0" to-layer="4862" to-port="1" /> <edge from-layer="4862" from-port="2" to-layer="4863" to-port="0" /> <edge from-layer="4863" from-port="1" to-layer="4864" to-port="1" /> <edge from-layer="4864" from-port="2" to-layer="4866" to-port="0" /> <edge from-layer="4865" from-port="0" to-layer="4866" to-port="1" /> <edge from-layer="4866" from-port="2" to-layer="4867" to-port="0" /> <edge from-layer="4867" from-port="1" to-layer="4878" to-port="0" /> <edge from-layer="4868" from-port="0" to-layer="4869" to-port="0" /> <edge from-layer="4869" from-port="1" to-layer="4872" to-port="0" /> <edge from-layer="4870" from-port="0" to-layer="4871" to-port="0" /> <edge from-layer="4871" from-port="1" to-layer="4872" to-port="1" /> <edge from-layer="4872" from-port="2" to-layer="4874" to-port="0" /> <edge from-layer="4873" from-port="0" to-layer="4874" to-port="1" /> <edge from-layer="4874" from-port="2" to-layer="4876" to-port="0" /> <edge from-layer="4875" from-port="0" to-layer="4876" to-port="1" /> <edge from-layer="4876" from-port="2" to-layer="4877" to-port="0" /> <edge from-layer="4877" from-port="1" to-layer="4878" to-port="1" /> <edge from-layer="4878" from-port="2" to-layer="4880" to-port="0" /> <edge from-layer="4879" from-port="0" to-layer="4880" to-port="1" /> <edge from-layer="4880" from-port="2" to-layer="4881" to-port="1" /> <edge from-layer="4881" from-port="2" to-layer="4883" to-port="0" /> <edge from-layer="4881" from-port="2" to-layer="5000" to-port="0" /> <edge from-layer="4882" from-port="0" to-layer="4883" to-port="1" /> <edge from-layer="4883" from-port="2" to-layer="4885" to-port="0" /> <edge from-layer="4884" from-port="0" to-layer="4885" to-port="1" /> <edge from-layer="4885" from-port="2" to-layer="4887" to-port="0" /> <edge from-layer="4886" from-port="0" to-layer="4887" to-port="1" /> <edge from-layer="4887" from-port="2" to-layer="4926" to-port="0" /> <edge from-layer="4887" from-port="2" to-layer="4975" to-port="0" /> <edge from-layer="4887" from-port="2" to-layer="4898" to-port="0" /> <edge from-layer="4888" from-port="0" to-layer="4889" to-port="0" /> <edge from-layer="4889" from-port="1" to-layer="4892" to-port="0" /> <edge from-layer="4890" from-port="0" to-layer="4891" to-port="0" /> <edge from-layer="4891" from-port="1" to-layer="4892" to-port="1" /> <edge from-layer="4892" from-port="2" to-layer="4894" to-port="0" /> <edge from-layer="4893" from-port="0" to-layer="4894" to-port="1" /> <edge from-layer="4894" from-port="2" to-layer="4896" to-port="0" /> <edge from-layer="4895" from-port="0" to-layer="4896" to-port="1" /> <edge from-layer="4896" from-port="2" to-layer="4897" to-port="0" /> <edge from-layer="4897" from-port="1" to-layer="4898" to-port="1" /> <edge from-layer="4898" from-port="2" to-layer="4900" to-port="0" /> <edge from-layer="4899" from-port="0" to-layer="4900" to-port="1" /> <edge from-layer="4900" from-port="2" to-layer="4902" to-port="0" /> <edge from-layer="4901" from-port="0" to-layer="4902" to-port="1" /> <edge from-layer="4902" from-port="2" to-layer="4904" to-port="0" /> <edge from-layer="4903" from-port="0" to-layer="4904" to-port="1" /> <edge from-layer="4904" from-port="2" to-layer="4905" to-port="1" /> <edge from-layer="4905" from-port="2" to-layer="4982" to-port="2" /> <edge from-layer="4905" from-port="2" to-layer="4906" to-port="0" /> <edge from-layer="4907" from-port="0" to-layer="4912" to-port="0" /> <edge from-layer="4908" from-port="0" to-layer="4911" to-port="1" /> <edge from-layer="4909" from-port="0" to-layer="4911" to-port="2" /> <edge from-layer="4910" from-port="0" to-layer="4911" to-port="3" /> <edge from-layer="4911" from-port="4" to-layer="4912" to-port="1" /> <edge from-layer="4912" from-port="2" to-layer="4913" to-port="0" /> <edge from-layer="4913" from-port="1" to-layer="4915" to-port="0" /> <edge from-layer="4914" from-port="0" to-layer="4915" to-port="2" /> <edge from-layer="4915" from-port="3" to-layer="4931" to-port="0" /> <edge from-layer="4916" from-port="0" to-layer="4917" to-port="0" /> <edge from-layer="4917" from-port="1" to-layer="4920" to-port="0" /> <edge from-layer="4918" from-port="0" to-layer="4919" to-port="0" /> <edge from-layer="4919" from-port="1" to-layer="4920" to-port="1" /> <edge from-layer="4920" from-port="2" to-layer="4922" to-port="0" /> <edge from-layer="4921" from-port="0" to-layer="4922" to-port="1" /> <edge from-layer="4922" from-port="2" to-layer="4924" to-port="0" /> <edge from-layer="4923" from-port="0" to-layer="4924" to-port="1" /> <edge from-layer="4924" from-port="2" to-layer="4925" to-port="0" /> <edge from-layer="4925" from-port="1" to-layer="4926" to-port="1" /> <edge from-layer="4926" from-port="2" to-layer="4928" to-port="0" /> <edge from-layer="4927" from-port="0" to-layer="4928" to-port="1" /> <edge from-layer="4928" from-port="2" to-layer="4930" to-port="0" /> <edge from-layer="4929" from-port="0" to-layer="4930" to-port="1" /> <edge from-layer="4930" from-port="2" to-layer="4931" to-port="1" /> <edge from-layer="4931" from-port="2" to-layer="4982" to-port="1" /> <edge from-layer="4931" from-port="2" to-layer="4932" to-port="0" /> <edge from-layer="4965" from-port="0" to-layer="4966" to-port="0" /> <edge from-layer="4966" from-port="1" to-layer="4969" to-port="0" /> <edge from-layer="4967" from-port="0" to-layer="4968" to-port="0" /> <edge from-layer="4968" from-port="1" to-layer="4969" to-port="1" /> <edge from-layer="4969" from-port="2" to-layer="4971" to-port="0" /> <edge from-layer="4970" from-port="0" to-layer="4971" to-port="1" /> <edge from-layer="4971" from-port="2" to-layer="4973" to-port="0" /> <edge from-layer="4972" from-port="0" to-layer="4973" to-port="1" /> <edge from-layer="4973" from-port="2" to-layer="4974" to-port="0" /> <edge from-layer="4974" from-port="1" to-layer="4975" to-port="1" /> <edge from-layer="4975" from-port="2" to-layer="4977" to-port="0" /> <edge from-layer="4976" from-port="0" to-layer="4977" to-port="1" /> <edge from-layer="4977" from-port="2" to-layer="4979" to-port="0" /> <edge from-layer="4978" from-port="0" to-layer="4979" to-port="1" /> <edge from-layer="4979" from-port="2" to-layer="4981" to-port="0" /> <edge from-layer="4980" from-port="0" to-layer="4981" to-port="1" /> <edge from-layer="4981" from-port="2" to-layer="4982" to-port="0" /> <edge from-layer="4982" from-port="4" to-layer="4984" to-port="0" /> <edge from-layer="4983" from-port="0" to-layer="4984" to-port="1" /> <edge from-layer="4984" from-port="2" to-layer="4986" to-port="0" /> <edge from-layer="4985" from-port="0" to-layer="4986" to-port="1" /> <edge from-layer="4986" from-port="2" to-layer="4997" to-port="0" /> <edge from-layer="4987" from-port="0" to-layer="4988" to-port="0" /> <edge from-layer="4988" from-port="1" to-layer="4991" to-port="0" /> <edge from-layer="4989" from-port="0" to-layer="4990" to-port="0" /> <edge from-layer="4990" from-port="1" to-layer="4991" to-port="1" /> <edge from-layer="4991" from-port="2" to-layer="4993" to-port="0" /> <edge from-layer="4992" from-port="0" to-layer="4993" to-port="1" /> <edge from-layer="4993" from-port="2" to-layer="4995" to-port="0" /> <edge from-layer="4994" from-port="0" to-layer="4995" to-port="1" /> <edge from-layer="4995" from-port="2" to-layer="4996" to-port="0" /> <edge from-layer="4996" from-port="1" to-layer="4997" to-port="1" /> <edge from-layer="4997" from-port="2" to-layer="4999" to-port="0" /> <edge from-layer="4998" from-port="0" to-layer="4999" to-port="1" /> <edge from-layer="4999" from-port="2" to-layer="5000" to-port="1" /> <edge from-layer="5000" from-port="2" to-layer="5042" to-port="0" /> <edge from-layer="5000" from-port="2" to-layer="5002" to-port="0" /> <edge from-layer="5001" from-port="0" to-layer="5002" to-port="1" /> <edge from-layer="5002" from-port="2" to-layer="5004" to-port="0" /> <edge from-layer="5003" from-port="0" to-layer="5004" to-port="1" /> <edge from-layer="5004" from-port="2" to-layer="5006" to-port="0" /> <edge from-layer="5005" from-port="0" to-layer="5006" to-port="1" /> <edge from-layer="5006" from-port="2" to-layer="5017" to-port="0" /> <edge from-layer="5007" from-port="0" to-layer="5008" to-port="0" /> <edge from-layer="5008" from-port="1" to-layer="5011" to-port="0" /> <edge from-layer="5009" from-port="0" to-layer="5010" to-port="0" /> <edge from-layer="5010" from-port="1" to-layer="5011" to-port="1" /> <edge from-layer="5011" from-port="2" to-layer="5013" to-port="0" /> <edge from-layer="5012" from-port="0" to-layer="5013" to-port="1" /> <edge from-layer="5013" from-port="2" to-layer="5015" to-port="0" /> <edge from-layer="5014" from-port="0" to-layer="5015" to-port="1" /> <edge from-layer="5015" from-port="2" to-layer="5016" to-port="0" /> <edge from-layer="5016" from-port="1" to-layer="5017" to-port="1" /> <edge from-layer="5017" from-port="2" to-layer="5019" to-port="0" /> <edge from-layer="5018" from-port="0" to-layer="5019" to-port="1" /> <edge from-layer="5019" from-port="2" to-layer="5021" to-port="0" /> <edge from-layer="5020" from-port="0" to-layer="5021" to-port="1" /> <edge from-layer="5021" from-port="2" to-layer="5023" to-port="0" /> <edge from-layer="5022" from-port="0" to-layer="5023" to-port="1" /> <edge from-layer="5023" from-port="2" to-layer="5024" to-port="0" /> <edge from-layer="5024" from-port="3" to-layer="5026" to-port="0" /> <edge from-layer="5025" from-port="0" to-layer="5026" to-port="1" /> <edge from-layer="5026" from-port="2" to-layer="5028" to-port="0" /> <edge from-layer="5027" from-port="0" to-layer="5028" to-port="1" /> <edge from-layer="5028" from-port="2" to-layer="5039" to-port="0" /> <edge from-layer="5029" from-port="0" to-layer="5030" to-port="0" /> <edge from-layer="5030" from-port="1" to-layer="5033" to-port="0" /> <edge from-layer="5031" from-port="0" to-layer="5032" to-port="0" /> <edge from-layer="5032" from-port="1" to-layer="5033" to-port="1" /> <edge from-layer="5033" from-port="2" to-layer="5035" to-port="0" /> <edge from-layer="5034" from-port="0" to-layer="5035" to-port="1" /> <edge from-layer="5035" from-port="2" to-layer="5037" to-port="0" /> <edge from-layer="5036" from-port="0" to-layer="5037" to-port="1" /> <edge from-layer="5037" from-port="2" to-layer="5038" to-port="0" /> <edge from-layer="5038" from-port="1" to-layer="5039" to-port="1" /> <edge from-layer="5039" from-port="2" to-layer="5041" to-port="0" /> <edge from-layer="5040" from-port="0" to-layer="5041" to-port="1" /> <edge from-layer="5041" from-port="2" to-layer="5042" to-port="1" /> <edge from-layer="5042" from-port="2" to-layer="5076" to-port="0" /> <edge from-layer="5042" from-port="2" to-layer="5044" to-port="0" /> <edge from-layer="5043" from-port="0" to-layer="5044" to-port="1" /> <edge from-layer="5044" from-port="2" to-layer="5046" to-port="0" /> <edge from-layer="5045" from-port="0" to-layer="5046" to-port="1" /> <edge from-layer="5046" from-port="2" to-layer="5048" to-port="0" /> <edge from-layer="5047" from-port="0" to-layer="5048" to-port="1" /> <edge from-layer="5048" from-port="2" to-layer="5059" to-port="0" /> <edge from-layer="5049" from-port="0" to-layer="5050" to-port="0" /> <edge from-layer="5050" from-port="1" to-layer="5053" to-port="0" /> <edge from-layer="5051" from-port="0" to-layer="5052" to-port="0" /> <edge from-layer="5052" from-port="1" to-layer="5053" to-port="1" /> <edge from-layer="5053" from-port="2" to-layer="5055" to-port="0" /> <edge from-layer="5054" from-port="0" to-layer="5055" to-port="1" /> <edge from-layer="5055" from-port="2" to-layer="5057" to-port="0" /> <edge from-layer="5056" from-port="0" to-layer="5057" to-port="1" /> <edge from-layer="5057" from-port="2" to-layer="5058" to-port="0" /> <edge from-layer="5058" from-port="1" to-layer="5059" to-port="1" /> <edge from-layer="5059" from-port="2" to-layer="5061" to-port="0" /> <edge from-layer="5060" from-port="0" to-layer="5061" to-port="1" /> <edge from-layer="5061" from-port="2" to-layer="5062" to-port="0" /> <edge from-layer="5062" from-port="1" to-layer="5073" to-port="0" /> <edge from-layer="5063" from-port="0" to-layer="5064" to-port="0" /> <edge from-layer="5064" from-port="1" to-layer="5067" to-port="0" /> <edge from-layer="5065" from-port="0" to-layer="5066" to-port="0" /> <edge from-layer="5066" from-port="1" to-layer="5067" to-port="1" /> <edge from-layer="5067" from-port="2" to-layer="5069" to-port="0" /> <edge from-layer="5068" from-port="0" to-layer="5069" to-port="1" /> <edge from-layer="5069" from-port="2" to-layer="5071" to-port="0" /> <edge from-layer="5070" from-port="0" to-layer="5071" to-port="1" /> <edge from-layer="5071" from-port="2" to-layer="5072" to-port="0" /> <edge from-layer="5072" from-port="1" to-layer="5073" to-port="1" /> <edge from-layer="5073" from-port="2" to-layer="5075" to-port="0" /> <edge from-layer="5074" from-port="0" to-layer="5075" to-port="1" /> <edge from-layer="5075" from-port="2" to-layer="5076" to-port="1" /> <edge from-layer="5076" from-port="2" to-layer="5078" to-port="0" /> <edge from-layer="5077" from-port="0" to-layer="5078" to-port="1" /> <edge from-layer="5078" from-port="2" to-layer="5080" to-port="0" /> <edge from-layer="5079" from-port="0" to-layer="5080" to-port="1" /> <edge from-layer="5080" from-port="2" to-layer="5082" to-port="0" /> <edge from-layer="5081" from-port="0" to-layer="5082" to-port="1" /> <edge from-layer="5082" from-port="2" to-layer="5083" to-port="0" /> <edge from-layer="5083" from-port="2" to-layer="5084" to-port="0" /> </edges> <rt_info> <Runtime_version value="2025.2.0-19120-87425bc78ca-releases/2025/2" /> <conversion_parameters> <framework value="pytorch" /> <is_python_object value="True" /> </conversion_parameters> <nncf> <friendly_names_were_updated value="True" /> <weight_compression> <advanced_parameters value="{'statistics_path': None, 'awq_params': {'subset_size': 32, 'percent_to_apply': 0.002, 'alpha_min': 0.0, 'alpha_max': 1.0, 'steps': 100}, 'scale_estimation_params': {'subset_size': 64, 'initial_steps': 5, 'scale_steps': 5, 'weight_penalty': -1.0}, 'gptq_params': {'damp_percent': 0.1, 'block_size': 128, 'subset_size': 128}, 'lora_correction_params': {'adapter_rank': 8, 'num_iterations': 3, 'apply_regularization': True, 'subset_size': 128, 'use_int8_adapters': True}, 'lora_adapter_rank': 256}" /> <all_layers value="False" /> <awq value="False" /> <backup_mode value="int8_asym" /> <compression_format value="dequantize" /> <gptq value="False" /> <group_size value="128" /> <ignored_scope value="[]" /> <lora_correction value="False" /> <mode value="int4_asym" /> <ratio value="1.0" /> <scale_estimation value="False" /> <sensitivity_metric value="weight_quantization_error" /> </weight_compression> </nncf> <optimum> <nncf_version value="2.16.0" /> <optimum_intel_version value="1.24.0.dev0+08e3008" /> <optimum_version value="1.25.3" /> <pytorch_version value="2.7.0+cpu" /> <transformers_version value="4.51.3" /> </optimum> <runtime_options> <ACTIVATIONS_SCALE_FACTOR value="8.0" /> </runtime_options> </rt_info> </net>